ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/IO-AIO/AIO.xs
(Generate patch)

Comparing IO-AIO/AIO.xs (file contents):
Revision 1.70 by root, Tue Oct 24 15:15:56 2006 UTC vs.
Revision 1.85 by root, Sat Oct 28 23:32:29 2006 UTC

1/* solaris */ 1/* solaris */
2#define _POSIX_PTHREAD_SEMANTICS 1 2#define _POSIX_PTHREAD_SEMANTICS 1
3 3
4#if __linux 4#if __linux && !defined(_GNU_SOURCE)
5# define _GNU_SOURCE 5# define _GNU_SOURCE
6#endif 6#endif
7 7
8/* just in case */
8#define _REENTRANT 1 9#define _REENTRANT 1
9 10
10#include <errno.h> 11#include <errno.h>
11 12
12#include "EXTERN.h" 13#include "EXTERN.h"
42# else 43# else
43# error sendfile support requested but not available 44# error sendfile support requested but not available
44# endif 45# endif
45#endif 46#endif
46 47
48/* number of seconds after which idle threads exit */
49#define IDLE_TIMEOUT 10
50
47/* used for struct dirent, AIX doesn't provide it */ 51/* used for struct dirent, AIX doesn't provide it */
48#ifndef NAME_MAX 52#ifndef NAME_MAX
49# define NAME_MAX 4096 53# define NAME_MAX 4096
54#endif
55
56#ifndef PTHREAD_STACK_MIN
57/* care for broken platforms, e.g. windows */
58# define PTHREAD_STACK_MIN 16384
50#endif 59#endif
51 60
52#if __ia64 61#if __ia64
53# define STACKSIZE 65536 62# define STACKSIZE 65536
54#elif __i386 || __x86_64 /* 16k is unreasonably high :( */ 63#elif __i386 || __x86_64 /* 16k is unreasonably high :( */
55# define STACKSIZE PTHREAD_STACK_MIN 64# define STACKSIZE PTHREAD_STACK_MIN
56#else 65#else
57# define STACKSIZE 16384 66# define STACKSIZE 16384
58#endif 67#endif
59 68
69/* whether word reads are potentially non-atomic.
70 * this is conservative: most likely, the arches this runs
71 * on have atomic word reads/writes.
72 */
73#ifndef WORDACCESS_UNSAFE
74# if __i386 || __x86_64
75# define WORDACCESS_UNSAFE 0
76# else
77# define WORDACCESS_UNSAFE 1
78# endif
79#endif
80
60/* buffer size for various temporary buffers */ 81/* buffer size for various temporary buffers */
61#define AIO_BUFSIZE 65536 82#define AIO_BUFSIZE 65536
62 83
63#define dBUF \ 84#define dBUF \
85 char *aio_buf; \
86 LOCK (wrklock); \
64 char *aio_buf = malloc (AIO_BUFSIZE); \ 87 self->dbuf = aio_buf = malloc (AIO_BUFSIZE); \
88 UNLOCK (wrklock); \
65 if (!aio_buf) \ 89 if (!aio_buf) \
66 return -1; 90 return -1;
67
68#define fBUF free (aio_buf)
69 91
70enum { 92enum {
71 REQ_QUIT, 93 REQ_QUIT,
72 REQ_OPEN, REQ_CLOSE, 94 REQ_OPEN, REQ_CLOSE,
73 REQ_READ, REQ_WRITE, REQ_READAHEAD, 95 REQ_READ, REQ_WRITE, REQ_READAHEAD,
74 REQ_SENDFILE, 96 REQ_SENDFILE,
75 REQ_STAT, REQ_LSTAT, REQ_FSTAT, 97 REQ_STAT, REQ_LSTAT, REQ_FSTAT,
76 REQ_FSYNC, REQ_FDATASYNC, 98 REQ_FSYNC, REQ_FDATASYNC,
77 REQ_UNLINK, REQ_RMDIR, REQ_RENAME, 99 REQ_UNLINK, REQ_RMDIR, REQ_RENAME,
78 REQ_READDIR, 100 REQ_MKNOD, REQ_READDIR,
79 REQ_LINK, REQ_SYMLINK, 101 REQ_LINK, REQ_SYMLINK,
80 REQ_GROUP, REQ_NOP, 102 REQ_GROUP, REQ_NOP,
81 REQ_BUSY, 103 REQ_BUSY,
82}; 104};
83 105
123 DEFAULT_PRI = 0, 145 DEFAULT_PRI = 0,
124 PRI_BIAS = -PRI_MIN, 146 PRI_BIAS = -PRI_MIN,
125 NUM_PRI = PRI_MAX + PRI_BIAS + 1, 147 NUM_PRI = PRI_MAX + PRI_BIAS + 1,
126}; 148};
127 149
150#define AIO_TICKS ((1000000 + 1023) >> 10)
151
152static unsigned int max_poll_time = 0;
153static unsigned int max_poll_reqs = 0;
154
155/* calculate time difference in ~1/AIO_TICKS of a second */
156static int tvdiff (struct timeval *tv1, struct timeval *tv2)
157{
158 return (tv2->tv_sec - tv1->tv_sec ) * AIO_TICKS
159 + ((tv2->tv_usec - tv1->tv_usec) >> 10);
160}
161
128static int next_pri = DEFAULT_PRI + PRI_BIAS; 162static int next_pri = DEFAULT_PRI + PRI_BIAS;
129 163
130static int started, wanted; 164static unsigned int started, idle, wanted;
131static volatile int nreqs;
132static int max_outstanding = 1<<30;
133static int respipe [2];
134 165
135#if __linux && defined (PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP) 166#if __linux && defined (PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP)
136# define AIO_MUTEX_INIT PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP 167# define AIO_MUTEX_INIT PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP
137#else 168#else
138# define AIO_MUTEX_INIT PTHREAD_MUTEX_INITIALIZER 169# define AIO_MUTEX_INIT PTHREAD_MUTEX_INITIALIZER
139#endif 170#endif
140 171
172#define LOCK(mutex) pthread_mutex_lock (&(mutex))
173#define UNLOCK(mutex) pthread_mutex_unlock (&(mutex))
174
175/* worker threads management */
176static pthread_mutex_t wrklock = AIO_MUTEX_INIT;
177
178typedef struct worker {
179 /* locked by wrklock */
180 struct worker *prev, *next;
181
182 pthread_t tid;
183
184 /* locked by reslock, reqlock or wrklock */
185 aio_req req; /* currently processed request */
186 void *dbuf;
187 DIR *dirp;
188} worker;
189
190static worker wrk_first = { &wrk_first, &wrk_first, 0 };
191
192static void worker_clear (worker *wrk)
193{
194 if (wrk->dirp)
195 {
196 closedir (wrk->dirp);
197 wrk->dirp = 0;
198 }
199
200 if (wrk->dbuf)
201 {
202 free (wrk->dbuf);
203 wrk->dbuf = 0;
204 }
205}
206
207static void worker_free (worker *wrk)
208{
209 wrk->next->prev = wrk->prev;
210 wrk->prev->next = wrk->next;
211
212 free (wrk);
213}
214
215static volatile unsigned int nreqs, nready, npending;
216static volatile unsigned int max_idle = 4;
217static volatile unsigned int max_outstanding = 0xffffffff;
218static int respipe [2];
219
141static pthread_mutex_t reslock = AIO_MUTEX_INIT; 220static pthread_mutex_t reslock = AIO_MUTEX_INIT;
142static pthread_mutex_t reqlock = AIO_MUTEX_INIT; 221static pthread_mutex_t reqlock = AIO_MUTEX_INIT;
143static pthread_cond_t reqwait = PTHREAD_COND_INITIALIZER; 222static pthread_cond_t reqwait = PTHREAD_COND_INITIALIZER;
223
224#if WORDACCESS_UNSAFE
225
226static unsigned int get_nready ()
227{
228 unsigned int retval;
229
230 LOCK (reqlock);
231 retval = nready;
232 UNLOCK (reqlock);
233
234 return retval;
235}
236
237static unsigned int get_npending ()
238{
239 unsigned int retval;
240
241 LOCK (reslock);
242 retval = npending;
243 UNLOCK (reslock);
244
245 return retval;
246}
247
248static unsigned int get_nthreads ()
249{
250 unsigned int retval;
251
252 LOCK (wrklock);
253 retval = started;
254 UNLOCK (wrklock);
255
256 return retval;
257}
258
259#else
260
261# define get_nready() nready
262# define get_npending() npending
263# define get_nthreads() started
264
265#endif
144 266
145/* 267/*
146 * a somewhat faster data structure might be nice, but 268 * a somewhat faster data structure might be nice, but
147 * with 8 priorities this actually needs <20 insns 269 * with 8 priorities this actually needs <20 insns
148 * per shift, the most expensive operation. 270 * per shift, the most expensive operation.
194 } 316 }
195 317
196 abort (); 318 abort ();
197} 319}
198 320
321static int poll_cb ();
199static void req_invoke (aio_req req); 322static void req_invoke (aio_req req);
200static void req_free (aio_req req); 323static void req_free (aio_req req);
324static void req_cancel (aio_req req);
201 325
202/* must be called at most once */ 326/* must be called at most once */
203static SV *req_sv (aio_req req, const char *klass) 327static SV *req_sv (aio_req req, const char *klass)
204{ 328{
205 if (!req->self) 329 if (!req->self)
267 req_invoke (grp); 391 req_invoke (grp);
268 req_free (grp); 392 req_free (grp);
269 } 393 }
270} 394}
271 395
272static void poll_wait ()
273{
274 fd_set rfd;
275
276 while (nreqs)
277 {
278 int size;
279#if !(__i386 || __x86_64) /* safe without sempahore on this archs */
280 pthread_mutex_lock (&reslock);
281#endif
282 size = res_queue.size;
283#if !(__i386 || __x86_64) /* safe without sempahore on this archs */
284 pthread_mutex_unlock (&reslock);
285#endif
286
287 if (size)
288 return;
289
290 FD_ZERO(&rfd);
291 FD_SET(respipe [0], &rfd);
292
293 select (respipe [0] + 1, &rfd, 0, 0, 0);
294 }
295}
296
297static void req_invoke (aio_req req) 396static void req_invoke (aio_req req)
298{ 397{
299 dSP; 398 dSP;
300 399
301 if (!(req->flags & FLAG_CANCELLED) && SvOK (req->callback)) 400 if (!(req->flags & FLAG_CANCELLED) && SvOK (req->callback))
302 { 401 {
303 errno = req->errorno;
304
305 ENTER; 402 ENTER;
306 SAVETMPS; 403 SAVETMPS;
307 PUSHMARK (SP); 404 PUSHMARK (SP);
308 EXTEND (SP, 1); 405 EXTEND (SP, 1);
309 406
313 { 410 {
314 SV *rv = &PL_sv_undef; 411 SV *rv = &PL_sv_undef;
315 412
316 if (req->result >= 0) 413 if (req->result >= 0)
317 { 414 {
415 int i;
318 char *buf = req->data2ptr; 416 char *buf = req->data2ptr;
319 AV *av = newAV (); 417 AV *av = newAV ();
320 418
321 while (req->result) 419 av_extend (av, req->result - 1);
420
421 for (i = 0; i < req->result; ++i)
322 { 422 {
323 SV *sv = newSVpv (buf, 0); 423 SV *sv = newSVpv (buf, 0);
324 424
325 av_push (av, sv); 425 av_store (av, i, sv);
326 buf += SvCUR (sv) + 1; 426 buf += SvCUR (sv) + 1;
327 req->result--;
328 } 427 }
329 428
330 rv = sv_2mortal (newRV_noinc ((SV *)av)); 429 rv = sv_2mortal (newRV_noinc ((SV *)av));
331 } 430 }
332 431
372 default: 471 default:
373 PUSHs (sv_2mortal (newSViv (req->result))); 472 PUSHs (sv_2mortal (newSViv (req->result)));
374 break; 473 break;
375 } 474 }
376 475
476 errno = req->errorno;
377 477
378 PUTBACK; 478 PUTBACK;
379 call_sv (req->callback, G_VOID | G_EVAL); 479 call_sv (req->callback, G_VOID | G_EVAL);
380 SPAGAIN; 480 SPAGAIN;
381 481
416 SvREFCNT_dec (req->fh); 516 SvREFCNT_dec (req->fh);
417 SvREFCNT_dec (req->fh2); 517 SvREFCNT_dec (req->fh2);
418 SvREFCNT_dec (req->callback); 518 SvREFCNT_dec (req->callback);
419 Safefree (req->statdata); 519 Safefree (req->statdata);
420 520
421 if (req->type == REQ_READDIR && req->result >= 0) 521 if (req->type == REQ_READDIR)
422 free (req->data2ptr); 522 free (req->data2ptr);
423 523
424 Safefree (req); 524 Safefree (req);
425} 525}
426 526
527static void req_cancel_subs (aio_req grp)
528{
529 aio_req sub;
530
531 if (grp->type != REQ_GROUP)
532 return;
533
534 SvREFCNT_dec (grp->fh2);
535 grp->fh2 = 0;
536
537 for (sub = grp->grp_first; sub; sub = sub->grp_next)
538 req_cancel (sub);
539}
540
427static void req_cancel (aio_req req) 541static void req_cancel (aio_req req)
428{ 542{
429 req->flags |= FLAG_CANCELLED; 543 req->flags |= FLAG_CANCELLED;
430 544
431 if (req->type == REQ_GROUP) 545 req_cancel_subs (req);
432 {
433 aio_req sub;
434
435 for (sub = req->grp_first; sub; sub = sub->grp_next)
436 req_cancel (sub);
437 }
438}
439
440static int poll_cb ()
441{
442 dSP;
443 int count = 0;
444 int do_croak = 0;
445 aio_req req;
446
447 for (;;)
448 {
449 pthread_mutex_lock (&reslock);
450 req = reqq_shift (&res_queue);
451
452 if (req)
453 {
454 if (!res_queue.size)
455 {
456 /* read any signals sent by the worker threads */
457 char buf [32];
458 while (read (respipe [0], buf, 32) == 32)
459 ;
460 }
461 }
462
463 pthread_mutex_unlock (&reslock);
464
465 if (!req)
466 break;
467
468 --nreqs;
469
470 if (req->type == REQ_QUIT)
471 started--;
472 else if (req->type == REQ_GROUP && req->length)
473 {
474 req->fd = 1; /* mark request as delayed */
475 continue;
476 }
477 else
478 {
479 if (req->type == REQ_READ)
480 SvCUR_set (req->data, req->dataoffset + (req->result > 0 ? req->result : 0));
481
482 if (req->data2ptr && (req->type == REQ_READ || req->type == REQ_WRITE))
483 SvREADONLY_off (req->data);
484
485 if (req->statdata)
486 {
487 PL_laststype = req->type == REQ_LSTAT ? OP_LSTAT : OP_STAT;
488 PL_laststatval = req->result;
489 PL_statcache = *(req->statdata);
490 }
491
492 req_invoke (req);
493
494 count++;
495 }
496
497 req_free (req);
498 }
499
500 return count;
501} 546}
502 547
503static void *aio_proc(void *arg); 548static void *aio_proc(void *arg);
504 549
505static void start_thread (void) 550static void start_thread (void)
506{ 551{
507 sigset_t fullsigset, oldsigset; 552 sigset_t fullsigset, oldsigset;
508 pthread_t tid;
509 pthread_attr_t attr; 553 pthread_attr_t attr;
554
555 worker *wrk = calloc (1, sizeof (worker));
556
557 if (!wrk)
558 croak ("unable to allocate worker thread data");
510 559
511 pthread_attr_init (&attr); 560 pthread_attr_init (&attr);
512 pthread_attr_setstacksize (&attr, STACKSIZE); 561 pthread_attr_setstacksize (&attr, STACKSIZE);
513 pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED); 562 pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
563#ifdef PTHREAD_SCOPE_PROCESS
564 pthread_attr_setscope (&attr, PTHREAD_SCOPE_PROCESS);
565#endif
514 566
515 sigfillset (&fullsigset); 567 sigfillset (&fullsigset);
568
569 LOCK (wrklock);
516 sigprocmask (SIG_SETMASK, &fullsigset, &oldsigset); 570 sigprocmask (SIG_SETMASK, &fullsigset, &oldsigset);
517 571
518 if (pthread_create (&tid, &attr, aio_proc, 0) == 0) 572 if (pthread_create (&wrk->tid, &attr, aio_proc, (void *)wrk) == 0)
573 {
574 wrk->prev = &wrk_first;
575 wrk->next = wrk_first.next;
576 wrk_first.next->prev = wrk;
577 wrk_first.next = wrk;
519 started++; 578 ++started;
579 }
580 else
581 free (wrk);
520 582
521 sigprocmask (SIG_SETMASK, &oldsigset, 0); 583 sigprocmask (SIG_SETMASK, &oldsigset, 0);
584 UNLOCK (wrklock);
585}
586
587static void maybe_start_thread ()
588{
589 if (get_nthreads () >= wanted)
590 return;
591
592 /* todo: maybe use idle here, but might be less exact */
593 if (0 <= (int)get_nthreads () + (int)get_npending () - (int)nreqs)
594 return;
595
596 start_thread ();
522} 597}
523 598
524static void req_send (aio_req req) 599static void req_send (aio_req req)
525{ 600{
526 while (started < wanted && nreqs >= started)
527 start_thread ();
528
529 ++nreqs; 601 ++nreqs;
530 602
531 pthread_mutex_lock (&reqlock); 603 LOCK (reqlock);
604 ++nready;
532 reqq_push (&req_queue, req); 605 reqq_push (&req_queue, req);
533 pthread_cond_signal (&reqwait); 606 pthread_cond_signal (&reqwait);
534 pthread_mutex_unlock (&reqlock); 607 UNLOCK (reqlock);
535 608
536 if (nreqs > max_outstanding) 609 maybe_start_thread ();
537 for (;;)
538 {
539 poll_cb ();
540
541 if (nreqs <= max_outstanding)
542 break;
543
544 poll_wait ();
545 }
546} 610}
547 611
548static void end_thread (void) 612static void end_thread (void)
549{ 613{
550 aio_req req; 614 aio_req req;
552 Newz (0, req, 1, aio_cb); 616 Newz (0, req, 1, aio_cb);
553 617
554 req->type = REQ_QUIT; 618 req->type = REQ_QUIT;
555 req->pri = PRI_MAX + PRI_BIAS; 619 req->pri = PRI_MAX + PRI_BIAS;
556 620
557 req_send (req); 621 LOCK (reqlock);
622 reqq_push (&req_queue, req);
623 pthread_cond_signal (&reqwait);
624 UNLOCK (reqlock);
625
626 LOCK (wrklock);
627 --started;
628 UNLOCK (wrklock);
629}
630
631static void set_max_idle (int nthreads)
632{
633 if (WORDACCESS_UNSAFE) LOCK (reqlock);
634 max_idle = nthreads <= 0 ? 1 : nthreads;
635 if (WORDACCESS_UNSAFE) UNLOCK (reqlock);
558} 636}
559 637
560static void min_parallel (int nthreads) 638static void min_parallel (int nthreads)
561{ 639{
562 if (wanted < nthreads) 640 if (wanted < nthreads)
563 wanted = nthreads; 641 wanted = nthreads;
564} 642}
565 643
566static void max_parallel (int nthreads) 644static void max_parallel (int nthreads)
567{ 645{
568 int cur = started;
569
570 if (wanted > nthreads) 646 if (wanted > nthreads)
571 wanted = nthreads; 647 wanted = nthreads;
572 648
573 while (cur > wanted)
574 {
575 end_thread ();
576 cur--;
577 }
578
579 while (started > wanted) 649 while (started > wanted)
650 end_thread ();
651}
652
653static void poll_wait ()
654{
655 fd_set rfd;
656
657 while (nreqs)
658 {
659 int size;
660 if (WORDACCESS_UNSAFE) LOCK (reslock);
661 size = res_queue.size;
662 if (WORDACCESS_UNSAFE) UNLOCK (reslock);
663
664 if (size)
665 return;
666
667 maybe_start_thread ();
668
669 FD_ZERO(&rfd);
670 FD_SET(respipe [0], &rfd);
671
672 select (respipe [0] + 1, &rfd, 0, 0, 0);
580 { 673 }
674}
675
676static int poll_cb ()
677{
678 dSP;
679 int count = 0;
680 int maxreqs = max_poll_reqs;
681 int do_croak = 0;
682 struct timeval tv_start, tv_now;
683 aio_req req;
684
685 if (max_poll_time)
686 gettimeofday (&tv_start, 0);
687
688 for (;;)
689 {
690 for (;;)
691 {
692 maybe_start_thread ();
693
694 LOCK (reslock);
695 req = reqq_shift (&res_queue);
696
697 if (req)
698 {
699 --npending;
700
701 if (!res_queue.size)
702 {
703 /* read any signals sent by the worker threads */
704 char buf [32];
705 while (read (respipe [0], buf, 32) == 32)
706 ;
707 }
708 }
709
710 UNLOCK (reslock);
711
712 if (!req)
713 break;
714
715 --nreqs;
716
717 if (req->type == REQ_GROUP && req->length)
718 {
719 req->fd = 1; /* mark request as delayed */
720 continue;
721 }
722 else
723 {
724 if (req->type == REQ_READ)
725 SvCUR_set (req->data, req->dataoffset + (req->result > 0 ? req->result : 0));
726
727 if (req->data2ptr && (req->type == REQ_READ || req->type == REQ_WRITE))
728 SvREADONLY_off (req->data);
729
730 if (req->statdata)
731 {
732 PL_laststype = req->type == REQ_LSTAT ? OP_LSTAT : OP_STAT;
733 PL_laststatval = req->result;
734 PL_statcache = *(req->statdata);
735 }
736
737 req_invoke (req);
738
739 count++;
740 }
741
742 req_free (req);
743
744 if (maxreqs && !--maxreqs)
745 break;
746
747 if (max_poll_time)
748 {
749 gettimeofday (&tv_now, 0);
750
751 if (tvdiff (&tv_start, &tv_now) >= max_poll_time)
752 break;
753 }
754 }
755
756 if (nreqs <= max_outstanding)
757 break;
758
581 poll_wait (); 759 poll_wait ();
582 poll_cb (); 760
761 ++maxreqs;
583 } 762 }
763
764 return count;
584} 765}
585 766
586static void create_pipe () 767static void create_pipe ()
587{ 768{
588 if (pipe (respipe)) 769 if (pipe (respipe))
612static ssize_t pread (int fd, void *buf, size_t count, off_t offset) 793static ssize_t pread (int fd, void *buf, size_t count, off_t offset)
613{ 794{
614 ssize_t res; 795 ssize_t res;
615 off_t ooffset; 796 off_t ooffset;
616 797
617 pthread_mutex_lock (&preadwritelock); 798 LOCK (preadwritelock);
618 ooffset = lseek (fd, 0, SEEK_CUR); 799 ooffset = lseek (fd, 0, SEEK_CUR);
619 lseek (fd, offset, SEEK_SET); 800 lseek (fd, offset, SEEK_SET);
620 res = read (fd, buf, count); 801 res = read (fd, buf, count);
621 lseek (fd, ooffset, SEEK_SET); 802 lseek (fd, ooffset, SEEK_SET);
622 pthread_mutex_unlock (&preadwritelock); 803 UNLOCK (preadwritelock);
623 804
624 return res; 805 return res;
625} 806}
626 807
627static ssize_t pwrite (int fd, void *buf, size_t count, off_t offset) 808static ssize_t pwrite (int fd, void *buf, size_t count, off_t offset)
628{ 809{
629 ssize_t res; 810 ssize_t res;
630 off_t ooffset; 811 off_t ooffset;
631 812
632 pthread_mutex_lock (&preadwritelock); 813 LOCK (preadwritelock);
633 ooffset = lseek (fd, 0, SEEK_CUR); 814 ooffset = lseek (fd, 0, SEEK_CUR);
634 lseek (fd, offset, SEEK_SET); 815 lseek (fd, offset, SEEK_SET);
635 res = write (fd, buf, count); 816 res = write (fd, buf, count);
636 lseek (fd, offset, SEEK_SET); 817 lseek (fd, offset, SEEK_SET);
637 pthread_mutex_unlock (&preadwritelock); 818 UNLOCK (preadwritelock);
638 819
639 return res; 820 return res;
640} 821}
641#endif 822#endif
642 823
643#if !HAVE_FDATASYNC 824#if !HAVE_FDATASYNC
644# define fdatasync fsync 825# define fdatasync fsync
645#endif 826#endif
646 827
647#if !HAVE_READAHEAD 828#if !HAVE_READAHEAD
648# define readahead aio_readahead 829# define readahead(fd,offset,count) aio_readahead (fd, offset, count, self)
649 830
650static ssize_t readahead (int fd, off_t offset, size_t count) 831static ssize_t aio_readahead (int fd, off_t offset, size_t count, worker *self)
651{ 832{
652 dBUF; 833 dBUF;
653 834
654 while (count > 0) 835 while (count > 0)
655 { 836 {
658 pread (fd, aio_buf, len, offset); 839 pread (fd, aio_buf, len, offset);
659 offset += len; 840 offset += len;
660 count -= len; 841 count -= len;
661 } 842 }
662 843
663 fBUF;
664
665 errno = 0; 844 errno = 0;
666} 845}
846
667#endif 847#endif
668 848
669#if !HAVE_READDIR_R 849#if !HAVE_READDIR_R
670# define readdir_r aio_readdir_r 850# define readdir_r aio_readdir_r
671 851
674static int readdir_r (DIR *dirp, struct dirent *ent, struct dirent **res) 854static int readdir_r (DIR *dirp, struct dirent *ent, struct dirent **res)
675{ 855{
676 struct dirent *e; 856 struct dirent *e;
677 int errorno; 857 int errorno;
678 858
679 pthread_mutex_lock (&readdirlock); 859 LOCK (readdirlock);
680 860
681 e = readdir (dirp); 861 e = readdir (dirp);
682 errorno = errno; 862 errorno = errno;
683 863
684 if (e) 864 if (e)
687 strcpy (ent->d_name, e->d_name); 867 strcpy (ent->d_name, e->d_name);
688 } 868 }
689 else 869 else
690 *res = 0; 870 *res = 0;
691 871
692 pthread_mutex_unlock (&readdirlock); 872 UNLOCK (readdirlock);
693 873
694 errno = errorno; 874 errno = errorno;
695 return e ? 0 : -1; 875 return e ? 0 : -1;
696} 876}
697#endif 877#endif
698 878
699/* sendfile always needs emulation */ 879/* sendfile always needs emulation */
700static ssize_t sendfile_ (int ofd, int ifd, off_t offset, size_t count) 880static ssize_t sendfile_ (int ofd, int ifd, off_t offset, size_t count, worker *self)
701{ 881{
702 ssize_t res; 882 ssize_t res;
703 883
704 if (!count) 884 if (!count)
705 return 0; 885 return 0;
716 { 896 {
717 off_t sbytes; 897 off_t sbytes;
718 res = sendfile (ifd, ofd, offset, count, 0, &sbytes, 0); 898 res = sendfile (ifd, ofd, offset, count, 0, &sbytes, 0);
719 899
720 if (res < 0 && sbytes) 900 if (res < 0 && sbytes)
721 /* maybe only on EAGAIN only: as usual, the manpage leaves you guessing */ 901 /* maybe only on EAGAIN: as usual, the manpage leaves you guessing */
722 res = sbytes; 902 res = sbytes;
723 } 903 }
724 904
725# elif __hpux 905# elif __hpux
726 res = sendfile (ofd, ifd, offset, count, 0, 0); 906 res = sendfile (ofd, ifd, offset, count, 0, 0);
782 962
783 offset += cnt; 963 offset += cnt;
784 res += cnt; 964 res += cnt;
785 count -= cnt; 965 count -= cnt;
786 } 966 }
787
788 fBUF;
789 } 967 }
790 968
791 return res; 969 return res;
792} 970}
793 971
794/* read a full directory */ 972/* read a full directory */
795static int scandir_ (const char *path, void **namesp) 973static void scandir_ (aio_req req, worker *self)
796{ 974{
797 DIR *dirp; 975 DIR *dirp;
798 union 976 union
799 { 977 {
800 struct dirent d; 978 struct dirent d;
805 int memlen = 4096; 983 int memlen = 4096;
806 int memofs = 0; 984 int memofs = 0;
807 int res = 0; 985 int res = 0;
808 int errorno; 986 int errorno;
809 987
810 dirp = opendir (path); 988 LOCK (wrklock);
811 if (!dirp) 989 self->dirp = dirp = opendir (req->dataptr);
812 return -1;
813
814 u = malloc (sizeof (*u)); 990 self->dbuf = u = malloc (sizeof (*u));
815 names = malloc (memlen); 991 req->data2ptr = names = malloc (memlen);
992 UNLOCK (wrklock);
816 993
817 if (u && names) 994 if (dirp && u && names)
818 for (;;) 995 for (;;)
819 { 996 {
820 errno = 0; 997 errno = 0;
821 readdir_r (dirp, &u->d, &entp); 998 readdir_r (dirp, &u->d, &entp);
822 999
832 res++; 1009 res++;
833 1010
834 while (memofs + len > memlen) 1011 while (memofs + len > memlen)
835 { 1012 {
836 memlen *= 2; 1013 memlen *= 2;
1014 LOCK (wrklock);
837 names = realloc (names, memlen); 1015 req->data2ptr = names = realloc (names, memlen);
1016 UNLOCK (wrklock);
1017
838 if (!names) 1018 if (!names)
839 break; 1019 break;
840 } 1020 }
841 1021
842 memcpy (names + memofs, name, len); 1022 memcpy (names + memofs, name, len);
843 memofs += len; 1023 memofs += len;
844 } 1024 }
845 } 1025 }
846 1026
847 errorno = errno;
848 free (u);
849 closedir (dirp);
850
851 if (errorno) 1027 if (errno)
852 {
853 free (names);
854 errno = errorno;
855 res = -1; 1028 res = -1;
856 } 1029
857 1030 req->result = res;
858 *namesp = (void *)names;
859 return res;
860} 1031}
861 1032
862/*****************************************************************************/ 1033/*****************************************************************************/
863 1034
864static void *aio_proc (void *thr_arg) 1035static void *aio_proc (void *thr_arg)
865{ 1036{
866 aio_req req; 1037 aio_req req;
867 int type; 1038 struct timespec ts;
1039 worker *self = (worker *)thr_arg;
868 1040
869 do 1041 /* try to distribute timeouts somewhat evenly */
1042 ts.tv_nsec = (((unsigned long)self + (unsigned long)ts.tv_sec) & 1023UL)
1043 * (1000000000UL / 1024UL);
1044
1045 for (;;)
870 { 1046 {
871 pthread_mutex_lock (&reqlock); 1047 ts.tv_sec = time (0) + IDLE_TIMEOUT;
1048
1049 LOCK (reqlock);
872 1050
873 for (;;) 1051 for (;;)
874 { 1052 {
875 req = reqq_shift (&req_queue); 1053 self->req = req = reqq_shift (&req_queue);
876 1054
877 if (req) 1055 if (req)
878 break; 1056 break;
879 1057
1058 ++idle;
1059
1060 if (pthread_cond_timedwait (&reqwait, &reqlock, &ts)
1061 == ETIMEDOUT)
1062 {
1063 if (idle > max_idle)
1064 {
1065 --idle;
1066 UNLOCK (reqlock);
1067 LOCK (wrklock);
1068 --started;
1069 UNLOCK (wrklock);
1070 goto quit;
1071 }
1072
1073 /* we are allowed to idle, so do so without any timeout */
880 pthread_cond_wait (&reqwait, &reqlock); 1074 pthread_cond_wait (&reqwait, &reqlock);
1075 ts.tv_sec = time (0) + IDLE_TIMEOUT;
1076 }
1077
1078 --idle;
881 } 1079 }
882 1080
883 pthread_mutex_unlock (&reqlock); 1081 --nready;
1082
1083 UNLOCK (reqlock);
884 1084
885 errno = 0; /* strictly unnecessary */ 1085 errno = 0; /* strictly unnecessary */
886 type = req->type; /* remember type for QUIT check */
887 1086
888 if (!(req->flags & FLAG_CANCELLED)) 1087 if (!(req->flags & FLAG_CANCELLED))
889 switch (type) 1088 switch (req->type)
890 { 1089 {
891 case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break; 1090 case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break;
892 case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break; 1091 case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break;
893 1092
894 case REQ_READAHEAD: req->result = readahead (req->fd, req->offset, req->length); break; 1093 case REQ_READAHEAD: req->result = readahead (req->fd, req->offset, req->length); break;
895 case REQ_SENDFILE: req->result = sendfile_ (req->fd, req->fd2, req->offset, req->length); break; 1094 case REQ_SENDFILE: req->result = sendfile_ (req->fd, req->fd2, req->offset, req->length, self); break;
896 1095
897 case REQ_STAT: req->result = stat (req->dataptr, req->statdata); break; 1096 case REQ_STAT: req->result = stat (req->dataptr, req->statdata); break;
898 case REQ_LSTAT: req->result = lstat (req->dataptr, req->statdata); break; 1097 case REQ_LSTAT: req->result = lstat (req->dataptr, req->statdata); break;
899 case REQ_FSTAT: req->result = fstat (req->fd , req->statdata); break; 1098 case REQ_FSTAT: req->result = fstat (req->fd , req->statdata); break;
900 1099
903 case REQ_UNLINK: req->result = unlink (req->dataptr); break; 1102 case REQ_UNLINK: req->result = unlink (req->dataptr); break;
904 case REQ_RMDIR: req->result = rmdir (req->dataptr); break; 1103 case REQ_RMDIR: req->result = rmdir (req->dataptr); break;
905 case REQ_RENAME: req->result = rename (req->data2ptr, req->dataptr); break; 1104 case REQ_RENAME: req->result = rename (req->data2ptr, req->dataptr); break;
906 case REQ_LINK: req->result = link (req->data2ptr, req->dataptr); break; 1105 case REQ_LINK: req->result = link (req->data2ptr, req->dataptr); break;
907 case REQ_SYMLINK: req->result = symlink (req->data2ptr, req->dataptr); break; 1106 case REQ_SYMLINK: req->result = symlink (req->data2ptr, req->dataptr); break;
1107 case REQ_MKNOD: req->result = mknod (req->data2ptr, req->mode, (dev_t)req->offset); break;
908 1108
909 case REQ_FDATASYNC: req->result = fdatasync (req->fd); break; 1109 case REQ_FDATASYNC: req->result = fdatasync (req->fd); break;
910 case REQ_FSYNC: req->result = fsync (req->fd); break; 1110 case REQ_FSYNC: req->result = fsync (req->fd); break;
911 case REQ_READDIR: req->result = scandir_ (req->dataptr, &req->data2ptr); break; 1111 case REQ_READDIR: scandir_ (req, self); break;
912 1112
913 case REQ_BUSY: 1113 case REQ_BUSY:
914 { 1114 {
915 struct timeval tv; 1115 struct timeval tv;
916 1116
920 req->result = select (0, 0, 0, 0, &tv); 1120 req->result = select (0, 0, 0, 0, &tv);
921 } 1121 }
922 1122
923 case REQ_GROUP: 1123 case REQ_GROUP:
924 case REQ_NOP: 1124 case REQ_NOP:
1125 break;
1126
925 case REQ_QUIT: 1127 case REQ_QUIT:
926 break; 1128 goto quit;
927 1129
928 default: 1130 default:
929 req->result = ENOSYS; 1131 req->result = ENOSYS;
930 break; 1132 break;
931 } 1133 }
932 1134
933 req->errorno = errno; 1135 req->errorno = errno;
934 1136
935 pthread_mutex_lock (&reslock); 1137 LOCK (reslock);
1138
1139 ++npending;
936 1140
937 if (!reqq_push (&res_queue, req)) 1141 if (!reqq_push (&res_queue, req))
938 /* write a dummy byte to the pipe so fh becomes ready */ 1142 /* write a dummy byte to the pipe so fh becomes ready */
939 write (respipe [1], &respipe, 1); 1143 write (respipe [1], &respipe, 1);
940 1144
941 pthread_mutex_unlock (&reslock); 1145 self->req = 0;
1146 worker_clear (self);
1147
1148 UNLOCK (reslock);
942 } 1149 }
943 while (type != REQ_QUIT); 1150
1151quit:
1152 LOCK (wrklock);
1153 worker_free (self);
1154 UNLOCK (wrklock);
944 1155
945 return 0; 1156 return 0;
946} 1157}
947 1158
948/*****************************************************************************/ 1159/*****************************************************************************/
949 1160
950static void atfork_prepare (void) 1161static void atfork_prepare (void)
951{ 1162{
952 pthread_mutex_lock (&reqlock); 1163 LOCK (wrklock);
953 pthread_mutex_lock (&reslock); 1164 LOCK (reqlock);
1165 LOCK (reslock);
954#if !HAVE_PREADWRITE 1166#if !HAVE_PREADWRITE
955 pthread_mutex_lock (&preadwritelock); 1167 LOCK (preadwritelock);
956#endif 1168#endif
957#if !HAVE_READDIR_R 1169#if !HAVE_READDIR_R
958 pthread_mutex_lock (&readdirlock); 1170 LOCK (readdirlock);
959#endif 1171#endif
960} 1172}
961 1173
962static void atfork_parent (void) 1174static void atfork_parent (void)
963{ 1175{
964#if !HAVE_READDIR_R 1176#if !HAVE_READDIR_R
965 pthread_mutex_unlock (&readdirlock); 1177 UNLOCK (readdirlock);
966#endif 1178#endif
967#if !HAVE_PREADWRITE 1179#if !HAVE_PREADWRITE
968 pthread_mutex_unlock (&preadwritelock); 1180 UNLOCK (preadwritelock);
969#endif 1181#endif
970 pthread_mutex_unlock (&reslock); 1182 UNLOCK (reslock);
971 pthread_mutex_unlock (&reqlock); 1183 UNLOCK (reqlock);
1184 UNLOCK (wrklock);
972} 1185}
973 1186
974static void atfork_child (void) 1187static void atfork_child (void)
975{ 1188{
976 aio_req prv; 1189 aio_req prv;
977
978 started = 0;
979 1190
980 while (prv = reqq_shift (&req_queue)) 1191 while (prv = reqq_shift (&req_queue))
981 req_free (prv); 1192 req_free (prv);
982 1193
983 while (prv = reqq_shift (&res_queue)) 1194 while (prv = reqq_shift (&res_queue))
984 req_free (prv); 1195 req_free (prv);
985 1196
1197 while (wrk_first.next != &wrk_first)
1198 {
1199 worker *wrk = wrk_first.next;
1200
1201 if (wrk->req)
1202 req_free (wrk->req);
1203
1204 worker_clear (wrk);
1205 worker_free (wrk);
1206 }
1207
1208 started = 0;
1209 idle = 0;
1210 nreqs = 0;
1211 nready = 0;
1212 npending = 0;
1213
986 close (respipe [0]); 1214 close (respipe [0]);
987 close (respipe [1]); 1215 close (respipe [1]);
988 create_pipe (); 1216 create_pipe ();
989 1217
990 atfork_parent (); 1218 atfork_parent ();
1016PROTOTYPES: ENABLE 1244PROTOTYPES: ENABLE
1017 1245
1018BOOT: 1246BOOT:
1019{ 1247{
1020 HV *stash = gv_stashpv ("IO::AIO", 1); 1248 HV *stash = gv_stashpv ("IO::AIO", 1);
1249
1021 newCONSTSUB (stash, "EXDEV", newSViv (EXDEV)); 1250 newCONSTSUB (stash, "EXDEV", newSViv (EXDEV));
1022 newCONSTSUB (stash, "O_RDONLY", newSViv (O_RDONLY)); 1251 newCONSTSUB (stash, "O_RDONLY", newSViv (O_RDONLY));
1023 newCONSTSUB (stash, "O_WRONLY", newSViv (O_WRONLY)); 1252 newCONSTSUB (stash, "O_WRONLY", newSViv (O_WRONLY));
1253 newCONSTSUB (stash, "O_CREAT", newSViv (O_CREAT));
1254 newCONSTSUB (stash, "O_TRUNC", newSViv (O_TRUNC));
1255 newCONSTSUB (stash, "S_IFIFO", newSViv (S_IFIFO));
1024 1256
1025 create_pipe (); 1257 create_pipe ();
1026 pthread_atfork (atfork_prepare, atfork_parent, atfork_child); 1258 pthread_atfork (atfork_prepare, atfork_parent, atfork_child);
1027} 1259}
1028 1260
1029void 1261void
1030min_parallel (nthreads) 1262max_poll_reqs (int nreqs)
1031 int nthreads
1032 PROTOTYPE: $ 1263 PROTOTYPE: $
1264 CODE:
1265 max_poll_reqs = nreqs;
1033 1266
1034void 1267void
1035max_parallel (nthreads) 1268max_poll_time (double nseconds)
1036 int nthreads
1037 PROTOTYPE: $ 1269 PROTOTYPE: $
1270 CODE:
1271 max_poll_time = nseconds * AIO_TICKS;
1272
1273void
1274min_parallel (int nthreads)
1275 PROTOTYPE: $
1276
1277void
1278max_parallel (int nthreads)
1279 PROTOTYPE: $
1280
1281void
1282max_idle (int nthreads)
1283 PROTOTYPE: $
1284 CODE:
1285 set_max_idle (nthreads);
1038 1286
1039int 1287int
1040max_outstanding (nreqs) 1288max_outstanding (int maxreqs)
1041 int nreqs 1289 PROTOTYPE: $
1042 PROTOTYPE: $
1043 CODE: 1290 CODE:
1044 RETVAL = max_outstanding; 1291 RETVAL = max_outstanding;
1045 max_outstanding = nreqs; 1292 max_outstanding = maxreqs;
1293 OUTPUT:
1294 RETVAL
1046 1295
1047void 1296void
1048aio_open (pathname,flags,mode,callback=&PL_sv_undef) 1297aio_open (pathname,flags,mode,callback=&PL_sv_undef)
1049 SV * pathname 1298 SV * pathname
1050 int flags 1299 int flags
1265 1514
1266 REQ_SEND; 1515 REQ_SEND;
1267} 1516}
1268 1517
1269void 1518void
1519aio_mknod (pathname,mode,dev,callback=&PL_sv_undef)
1520 SV * pathname
1521 SV * callback
1522 UV mode
1523 UV dev
1524 PPCODE:
1525{
1526 dREQ;
1527
1528 req->type = REQ_MKNOD;
1529 req->data = newSVsv (pathname);
1530 req->dataptr = SvPVbyte_nolen (req->data);
1531 req->mode = (mode_t)mode;
1532 req->offset = dev;
1533
1534 REQ_SEND;
1535}
1536
1537void
1270aio_busy (delay,callback=&PL_sv_undef) 1538aio_busy (delay,callback=&PL_sv_undef)
1271 double delay 1539 double delay
1272 SV * callback 1540 SV * callback
1273 PPCODE: 1541 PPCODE:
1274{ 1542{
1305 req->type = REQ_NOP; 1573 req->type = REQ_NOP;
1306 1574
1307 REQ_SEND; 1575 REQ_SEND;
1308} 1576}
1309 1577
1310void 1578int
1311aioreq_pri (int pri = DEFAULT_PRI) 1579aioreq_pri (int pri = 0)
1312 CODE: 1580 PROTOTYPE: ;$
1581 CODE:
1582 RETVAL = next_pri - PRI_BIAS;
1583 if (items > 0)
1584 {
1313 if (pri < PRI_MIN) pri = PRI_MIN; 1585 if (pri < PRI_MIN) pri = PRI_MIN;
1314 if (pri > PRI_MAX) pri = PRI_MAX; 1586 if (pri > PRI_MAX) pri = PRI_MAX;
1315 next_pri = pri + PRI_BIAS; 1587 next_pri = pri + PRI_BIAS;
1588 }
1589 OUTPUT:
1590 RETVAL
1316 1591
1317void 1592void
1318aioreq_nice (int nice = 0) 1593aioreq_nice (int nice = 0)
1319 CODE: 1594 CODE:
1320 nice = next_pri - nice; 1595 nice = next_pri - nice;
1321 if (nice < PRI_MIN) nice = PRI_MIN; 1596 if (nice < PRI_MIN) nice = PRI_MIN;
1322 if (nice > PRI_MAX) nice = PRI_MAX; 1597 if (nice > PRI_MAX) nice = PRI_MAX;
1323 next_pri = nice + PRI_BIAS; 1598 next_pri = nice + PRI_BIAS;
1324 1599
1325void 1600void
1326flush () 1601flush ()
1327 PROTOTYPE: 1602 PROTOTYPE:
1328 CODE: 1603 CODE:
1329 while (nreqs) 1604 while (nreqs)
1330 { 1605 {
1331 poll_wait (); 1606 poll_wait ();
1332 poll_cb (); 1607 poll_cb (0);
1333 } 1608 }
1334 1609
1335void 1610void
1336poll() 1611poll()
1337 PROTOTYPE: 1612 PROTOTYPE:
1338 CODE: 1613 CODE:
1339 if (nreqs) 1614 if (nreqs)
1340 { 1615 {
1341 poll_wait (); 1616 poll_wait ();
1342 poll_cb (); 1617 poll_cb (0);
1343 } 1618 }
1344 1619
1345int 1620int
1346poll_fileno() 1621poll_fileno()
1347 PROTOTYPE: 1622 PROTOTYPE:
1371 CODE: 1646 CODE:
1372 RETVAL = nreqs; 1647 RETVAL = nreqs;
1373 OUTPUT: 1648 OUTPUT:
1374 RETVAL 1649 RETVAL
1375 1650
1651int
1652nready()
1653 PROTOTYPE:
1654 CODE:
1655 RETVAL = get_nready ();
1656 OUTPUT:
1657 RETVAL
1658
1659int
1660npending()
1661 PROTOTYPE:
1662 CODE:
1663 RETVAL = get_npending ();
1664 OUTPUT:
1665 RETVAL
1666
1667int
1668nthreads()
1669 PROTOTYPE:
1670 CODE:
1671 if (WORDACCESS_UNSAFE) LOCK (wrklock);
1672 RETVAL = started;
1673 if (WORDACCESS_UNSAFE) UNLOCK (wrklock);
1674 OUTPUT:
1675 RETVAL
1676
1376PROTOTYPES: DISABLE 1677PROTOTYPES: DISABLE
1377 1678
1378MODULE = IO::AIO PACKAGE = IO::AIO::REQ 1679MODULE = IO::AIO PACKAGE = IO::AIO::REQ
1379 1680
1380void 1681void
1422 } 1723 }
1423 } 1724 }
1424} 1725}
1425 1726
1426void 1727void
1728cancel_subs (aio_req_ornot req)
1729 CODE:
1730 req_cancel_subs (req);
1731
1732void
1427result (aio_req grp, ...) 1733result (aio_req grp, ...)
1428 CODE: 1734 CODE:
1429{ 1735{
1430 int i; 1736 int i;
1737 AV *av;
1738
1739 grp->errorno = errno;
1740
1431 AV *av = newAV (); 1741 av = newAV ();
1432 1742
1433 for (i = 1; i < items; ++i ) 1743 for (i = 1; i < items; ++i )
1434 av_push (av, newSVsv (ST (i))); 1744 av_push (av, newSVsv (ST (i)));
1435 1745
1436 SvREFCNT_dec (grp->data); 1746 SvREFCNT_dec (grp->data);
1437 grp->data = (SV *)av; 1747 grp->data = (SV *)av;
1438} 1748}
1749
1750void
1751errno (aio_req grp, int errorno = errno)
1752 CODE:
1753 grp->errorno = errorno;
1439 1754
1440void 1755void
1441limit (aio_req grp, int limit) 1756limit (aio_req grp, int limit)
1442 CODE: 1757 CODE:
1443 grp->fd2 = limit; 1758 grp->fd2 = limit;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines