ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/IO-AIO/AIO.xs
(Generate patch)

Comparing IO-AIO/AIO.xs (file contents):
Revision 1.79 by root, Thu Oct 26 16:28:33 2006 UTC vs.
Revision 1.84 by root, Sat Oct 28 01:24:19 2006 UTC

43# else 43# else
44# error sendfile support requested but not available 44# error sendfile support requested but not available
45# endif 45# endif
46#endif 46#endif
47 47
48/* number of seconds after which idle threads exit */
49#define IDLE_TIMEOUT 10
50
48/* used for struct dirent, AIX doesn't provide it */ 51/* used for struct dirent, AIX doesn't provide it */
49#ifndef NAME_MAX 52#ifndef NAME_MAX
50# define NAME_MAX 4096 53# define NAME_MAX 4096
51#endif 54#endif
52 55
92 REQ_READ, REQ_WRITE, REQ_READAHEAD, 95 REQ_READ, REQ_WRITE, REQ_READAHEAD,
93 REQ_SENDFILE, 96 REQ_SENDFILE,
94 REQ_STAT, REQ_LSTAT, REQ_FSTAT, 97 REQ_STAT, REQ_LSTAT, REQ_FSTAT,
95 REQ_FSYNC, REQ_FDATASYNC, 98 REQ_FSYNC, REQ_FDATASYNC,
96 REQ_UNLINK, REQ_RMDIR, REQ_RENAME, 99 REQ_UNLINK, REQ_RMDIR, REQ_RENAME,
97 REQ_READDIR, 100 REQ_MKNOD, REQ_READDIR,
98 REQ_LINK, REQ_SYMLINK, 101 REQ_LINK, REQ_SYMLINK,
99 REQ_GROUP, REQ_NOP, 102 REQ_GROUP, REQ_NOP,
100 REQ_BUSY, 103 REQ_BUSY,
101}; 104};
102 105
144 NUM_PRI = PRI_MAX + PRI_BIAS + 1, 147 NUM_PRI = PRI_MAX + PRI_BIAS + 1,
145}; 148};
146 149
147static int next_pri = DEFAULT_PRI + PRI_BIAS; 150static int next_pri = DEFAULT_PRI + PRI_BIAS;
148 151
149static unsigned int started, wanted; 152static unsigned int started, idle, wanted;
150static volatile unsigned int nreqs, nready, npending;
151static volatile unsigned int max_outstanding = 0xffffffff;
152static int respipe [2];
153 153
154#if __linux && defined (PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP) 154#if __linux && defined (PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP)
155# define AIO_MUTEX_INIT PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP 155# define AIO_MUTEX_INIT PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP
156#else 156#else
157# define AIO_MUTEX_INIT PTHREAD_MUTEX_INITIALIZER 157# define AIO_MUTEX_INIT PTHREAD_MUTEX_INITIALIZER
198 wrk->prev->next = wrk->next; 198 wrk->prev->next = wrk->next;
199 199
200 free (wrk); 200 free (wrk);
201} 201}
202 202
203static volatile unsigned int nreqs, nready, npending;
204static volatile unsigned int max_idle = 4;
205static volatile unsigned int max_outstanding = 0xffffffff;
206static int respipe [2];
207
203static pthread_mutex_t reslock = AIO_MUTEX_INIT; 208static pthread_mutex_t reslock = AIO_MUTEX_INIT;
204static pthread_mutex_t reqlock = AIO_MUTEX_INIT; 209static pthread_mutex_t reqlock = AIO_MUTEX_INIT;
205static pthread_cond_t reqwait = PTHREAD_COND_INITIALIZER; 210static pthread_cond_t reqwait = PTHREAD_COND_INITIALIZER;
211
212#if WORDREAD_UNSAFE
213
214static unsigned int get_nready ()
215{
216 unsigned int retval;
217
218 LOCK (reqlock);
219 retval = nready;
220 UNLOCK (reqlock);
221
222 return retval;
223}
224
225static unsigned int get_npending ()
226{
227 unsigned int retval;
228
229 LOCK (reslock);
230 retval = npending;
231 UNLOCK (reslock);
232
233 return retval;
234}
235
236#else
237
238# define get_nready() nready
239# define get_npending() npending
240
241#endif
206 242
207/* 243/*
208 * a somewhat faster data structure might be nice, but 244 * a somewhat faster data structure might be nice, but
209 * with 8 priorities this actually needs <20 insns 245 * with 8 priorities this actually needs <20 insns
210 * per shift, the most expensive operation. 246 * per shift, the most expensive operation.
331 req_invoke (grp); 367 req_invoke (grp);
332 req_free (grp); 368 req_free (grp);
333 } 369 }
334} 370}
335 371
336static void poll_wait ()
337{
338 fd_set rfd;
339
340 while (nreqs)
341 {
342 int size;
343 if (WORDREAD_UNSAFE) LOCK (reslock);
344 size = res_queue.size;
345 if (WORDREAD_UNSAFE) UNLOCK (reslock);
346
347 if (size)
348 return;
349
350 FD_ZERO(&rfd);
351 FD_SET(respipe [0], &rfd);
352
353 select (respipe [0] + 1, &rfd, 0, 0, 0);
354 }
355}
356
357static void req_invoke (aio_req req) 372static void req_invoke (aio_req req)
358{ 373{
359 dSP; 374 dSP;
360 375
361 if (!(req->flags & FLAG_CANCELLED) && SvOK (req->callback)) 376 if (!(req->flags & FLAG_CANCELLED) && SvOK (req->callback))
504 req->flags |= FLAG_CANCELLED; 519 req->flags |= FLAG_CANCELLED;
505 520
506 req_cancel_subs (req); 521 req_cancel_subs (req);
507} 522}
508 523
524static void *aio_proc(void *arg);
525
526static void start_thread (void)
527{
528 sigset_t fullsigset, oldsigset;
529 pthread_attr_t attr;
530
531 worker *wrk = calloc (1, sizeof (worker));
532
533 if (!wrk)
534 croak ("unable to allocate worker thread data");
535
536 pthread_attr_init (&attr);
537 pthread_attr_setstacksize (&attr, STACKSIZE);
538 pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
539#ifdef PTHREAD_SCOPE_PROCESS
540 pthread_attr_setscope (&attr, PTHREAD_SCOPE_PROCESS);
541#endif
542
543 sigfillset (&fullsigset);
544
545 LOCK (wrklock);
546 sigprocmask (SIG_SETMASK, &fullsigset, &oldsigset);
547
548 if (pthread_create (&wrk->tid, &attr, aio_proc, (void *)wrk) == 0)
549 {
550 wrk->prev = &wrk_first;
551 wrk->next = wrk_first.next;
552 wrk_first.next->prev = wrk;
553 wrk_first.next = wrk;
554 ++started;
555 }
556 else
557 free (wrk);
558
559 sigprocmask (SIG_SETMASK, &oldsigset, 0);
560 UNLOCK (wrklock);
561}
562
563static void maybe_start_thread ()
564{
565 if (started >= wanted)
566 return;
567
568 /* todo: maybe use idle here, but might be less exact */
569 if ((int)nready <= (int)started - (int)(nreqs - get_nready () - get_npending ()))
570 return;
571
572 start_thread ();
573}
574
575static void req_send (aio_req req)
576{
577 ++nreqs;
578
579 LOCK (reqlock);
580 ++nready;
581 reqq_push (&req_queue, req);
582 pthread_cond_signal (&reqwait);
583 UNLOCK (reqlock);
584
585 maybe_start_thread ();
586}
587
588static void end_thread (void)
589{
590 aio_req req;
591
592 Newz (0, req, 1, aio_cb);
593
594 req->type = REQ_QUIT;
595 req->pri = PRI_MAX + PRI_BIAS;
596
597 LOCK (reqlock);
598 reqq_push (&req_queue, req);
599 pthread_cond_signal (&reqwait);
600 UNLOCK (reqlock);
601
602 LOCK (wrklock);
603 --started;
604 UNLOCK (wrklock);
605}
606
607static void min_parallel (int nthreads)
608{
609 if (wanted < nthreads)
610 wanted = nthreads;
611}
612
613static void max_parallel (int nthreads)
614{
615 if (wanted > nthreads)
616 wanted = nthreads;
617
618 while (started > wanted)
619 end_thread ();
620}
621
622static void poll_wait ()
623{
624 fd_set rfd;
625
626 while (nreqs)
627 {
628 int size;
629 if (WORDREAD_UNSAFE) LOCK (reslock);
630 size = res_queue.size;
631 if (WORDREAD_UNSAFE) UNLOCK (reslock);
632
633 if (size)
634 return;
635
636 maybe_start_thread ();
637
638 FD_ZERO(&rfd);
639 FD_SET(respipe [0], &rfd);
640
641 select (respipe [0] + 1, &rfd, 0, 0, 0);
642 }
643}
644
509static int poll_cb (int max) 645static int poll_cb (int max)
510{ 646{
511 dSP; 647 dSP;
512 int count = 0; 648 int count = 0;
513 int do_croak = 0; 649 int do_croak = 0;
515 651
516 for (;;) 652 for (;;)
517 { 653 {
518 while (max <= 0 || count < max) 654 while (max <= 0 || count < max)
519 { 655 {
656 maybe_start_thread ();
657
520 LOCK (reslock); 658 LOCK (reslock);
521 req = reqq_shift (&res_queue); 659 req = reqq_shift (&res_queue);
522 660
523 if (req) 661 if (req)
524 { 662 {
538 if (!req) 676 if (!req)
539 break; 677 break;
540 678
541 --nreqs; 679 --nreqs;
542 680
543 if (req->type == REQ_QUIT)
544 --started;
545 else if (req->type == REQ_GROUP && req->length) 681 if (req->type == REQ_GROUP && req->length)
546 { 682 {
547 req->fd = 1; /* mark request as delayed */ 683 req->fd = 1; /* mark request as delayed */
548 continue; 684 continue;
549 } 685 }
550 else 686 else
577 713
578 max = 0; 714 max = 0;
579 } 715 }
580 716
581 return count; 717 return count;
582}
583
584static void *aio_proc(void *arg);
585
586static void start_thread (void)
587{
588 sigset_t fullsigset, oldsigset;
589 pthread_attr_t attr;
590
591 worker *wrk = calloc (1, sizeof (worker));
592
593 if (!wrk)
594 croak ("unable to allocate worker thread data");
595
596 pthread_attr_init (&attr);
597 pthread_attr_setstacksize (&attr, STACKSIZE);
598 pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
599
600 sigfillset (&fullsigset);
601
602 LOCK (wrklock);
603 sigprocmask (SIG_SETMASK, &fullsigset, &oldsigset);
604
605 if (pthread_create (&wrk->tid, &attr, aio_proc, (void *)wrk) == 0)
606 {
607 wrk->prev = &wrk_first;
608 wrk->next = wrk_first.next;
609 wrk_first.next->prev = wrk;
610 wrk_first.next = wrk;
611 ++started;
612 }
613 else
614 free (wrk);
615
616 sigprocmask (SIG_SETMASK, &oldsigset, 0);
617 UNLOCK (wrklock);
618}
619
620static void req_send (aio_req req)
621{
622 while (started < wanted && nreqs >= started)
623 start_thread ();
624
625 ++nreqs;
626
627 LOCK (reqlock);
628 ++nready;
629 reqq_push (&req_queue, req);
630 pthread_cond_signal (&reqwait);
631 UNLOCK (reqlock);
632}
633
634static void end_thread (void)
635{
636 aio_req req;
637
638 Newz (0, req, 1, aio_cb);
639
640 req->type = REQ_QUIT;
641 req->pri = PRI_MAX + PRI_BIAS;
642
643 req_send (req);
644}
645
646static void min_parallel (int nthreads)
647{
648 if (wanted < nthreads)
649 wanted = nthreads;
650}
651
652static void max_parallel (int nthreads)
653{
654 int cur = started;
655
656 if (wanted > nthreads)
657 wanted = nthreads;
658
659 while (cur > wanted)
660 {
661 end_thread ();
662 cur--;
663 }
664
665 while (started > wanted)
666 {
667 poll_wait ();
668 poll_cb (0);
669 }
670} 718}
671 719
672static void create_pipe () 720static void create_pipe ()
673{ 721{
674 if (pipe (respipe)) 722 if (pipe (respipe))
938/*****************************************************************************/ 986/*****************************************************************************/
939 987
940static void *aio_proc (void *thr_arg) 988static void *aio_proc (void *thr_arg)
941{ 989{
942 aio_req req; 990 aio_req req;
943 int type; 991 struct timespec ts;
944 worker *self = (worker *)thr_arg; 992 worker *self = (worker *)thr_arg;
945 993
946 do 994 /* try to distribute timeouts somewhat evenly */
995 ts.tv_nsec = (((unsigned long)self + (unsigned long)ts.tv_sec) & 1023UL)
996 * (1000000000UL / 1024UL);
997
998 for (;;)
947 { 999 {
1000 ts.tv_sec = time (0) + IDLE_TIMEOUT;
1001
948 LOCK (reqlock); 1002 LOCK (reqlock);
949 1003
950 for (;;) 1004 for (;;)
951 { 1005 {
952 self->req = req = reqq_shift (&req_queue); 1006 self->req = req = reqq_shift (&req_queue);
953 1007
954 if (req) 1008 if (req)
955 break; 1009 break;
956 1010
1011 ++idle;
1012
1013 if (pthread_cond_timedwait (&reqwait, &reqlock, &ts)
1014 == ETIMEDOUT)
1015 {
1016 if (idle > max_idle)
1017 {
1018 --idle;
1019 UNLOCK (reqlock);
1020 LOCK (wrklock);
1021 --started;
1022 UNLOCK (wrklock);
1023 goto quit;
1024 }
1025
1026 /* we are allowed to idle, so do so without any timeout */
957 pthread_cond_wait (&reqwait, &reqlock); 1027 pthread_cond_wait (&reqwait, &reqlock);
1028 ts.tv_sec = time (0) + IDLE_TIMEOUT;
1029 }
1030
1031 --idle;
958 } 1032 }
959 1033
960 --nready; 1034 --nready;
961 1035
962 UNLOCK (reqlock); 1036 UNLOCK (reqlock);
963 1037
964 errno = 0; /* strictly unnecessary */ 1038 errno = 0; /* strictly unnecessary */
965 type = req->type; /* remember type for QUIT check */
966 1039
967 if (!(req->flags & FLAG_CANCELLED)) 1040 if (!(req->flags & FLAG_CANCELLED))
968 switch (type) 1041 switch (req->type)
969 { 1042 {
970 case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break; 1043 case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break;
971 case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break; 1044 case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break;
972 1045
973 case REQ_READAHEAD: req->result = readahead (req->fd, req->offset, req->length); break; 1046 case REQ_READAHEAD: req->result = readahead (req->fd, req->offset, req->length); break;
982 case REQ_UNLINK: req->result = unlink (req->dataptr); break; 1055 case REQ_UNLINK: req->result = unlink (req->dataptr); break;
983 case REQ_RMDIR: req->result = rmdir (req->dataptr); break; 1056 case REQ_RMDIR: req->result = rmdir (req->dataptr); break;
984 case REQ_RENAME: req->result = rename (req->data2ptr, req->dataptr); break; 1057 case REQ_RENAME: req->result = rename (req->data2ptr, req->dataptr); break;
985 case REQ_LINK: req->result = link (req->data2ptr, req->dataptr); break; 1058 case REQ_LINK: req->result = link (req->data2ptr, req->dataptr); break;
986 case REQ_SYMLINK: req->result = symlink (req->data2ptr, req->dataptr); break; 1059 case REQ_SYMLINK: req->result = symlink (req->data2ptr, req->dataptr); break;
1060 case REQ_MKNOD: req->result = mknod (req->data2ptr, req->mode, (dev_t)req->offset); break;
987 1061
988 case REQ_FDATASYNC: req->result = fdatasync (req->fd); break; 1062 case REQ_FDATASYNC: req->result = fdatasync (req->fd); break;
989 case REQ_FSYNC: req->result = fsync (req->fd); break; 1063 case REQ_FSYNC: req->result = fsync (req->fd); break;
990 case REQ_READDIR: scandir_ (req, self); break; 1064 case REQ_READDIR: scandir_ (req, self); break;
991 1065
999 req->result = select (0, 0, 0, 0, &tv); 1073 req->result = select (0, 0, 0, 0, &tv);
1000 } 1074 }
1001 1075
1002 case REQ_GROUP: 1076 case REQ_GROUP:
1003 case REQ_NOP: 1077 case REQ_NOP:
1078 break;
1079
1004 case REQ_QUIT: 1080 case REQ_QUIT:
1005 break; 1081 goto quit;
1006 1082
1007 default: 1083 default:
1008 req->result = ENOSYS; 1084 req->result = ENOSYS;
1009 break; 1085 break;
1010 } 1086 }
1022 self->req = 0; 1098 self->req = 0;
1023 worker_clear (self); 1099 worker_clear (self);
1024 1100
1025 UNLOCK (reslock); 1101 UNLOCK (reslock);
1026 } 1102 }
1027 while (type != REQ_QUIT);
1028 1103
1104quit:
1029 LOCK (wrklock); 1105 LOCK (wrklock);
1030 worker_free (self); 1106 worker_free (self);
1031 UNLOCK (wrklock); 1107 UNLOCK (wrklock);
1032 1108
1033 return 0; 1109 return 0;
1080 1156
1081 worker_clear (wrk); 1157 worker_clear (wrk);
1082 worker_free (wrk); 1158 worker_free (wrk);
1083 } 1159 }
1084 1160
1085 started = 0; 1161 started = 0;
1162 idle = 0;
1086 nreqs = 0; 1163 nreqs = 0;
1164 nready = 0;
1165 npending = 0;
1087 1166
1088 close (respipe [0]); 1167 close (respipe [0]);
1089 close (respipe [1]); 1168 close (respipe [1]);
1090 create_pipe (); 1169 create_pipe ();
1091 1170
1118PROTOTYPES: ENABLE 1197PROTOTYPES: ENABLE
1119 1198
1120BOOT: 1199BOOT:
1121{ 1200{
1122 HV *stash = gv_stashpv ("IO::AIO", 1); 1201 HV *stash = gv_stashpv ("IO::AIO", 1);
1202
1123 newCONSTSUB (stash, "EXDEV", newSViv (EXDEV)); 1203 newCONSTSUB (stash, "EXDEV", newSViv (EXDEV));
1124 newCONSTSUB (stash, "O_RDONLY", newSViv (O_RDONLY)); 1204 newCONSTSUB (stash, "O_RDONLY", newSViv (O_RDONLY));
1125 newCONSTSUB (stash, "O_WRONLY", newSViv (O_WRONLY)); 1205 newCONSTSUB (stash, "O_WRONLY", newSViv (O_WRONLY));
1206 newCONSTSUB (stash, "O_CREAT", newSViv (O_CREAT));
1207 newCONSTSUB (stash, "O_TRUNC", newSViv (O_TRUNC));
1208 newCONSTSUB (stash, "S_IFIFO", newSViv (S_IFIFO));
1126 1209
1127 create_pipe (); 1210 create_pipe ();
1128 pthread_atfork (atfork_prepare, atfork_parent, atfork_child); 1211 pthread_atfork (atfork_prepare, atfork_parent, atfork_child);
1129} 1212}
1130 1213
1361 req->type = ix; 1444 req->type = ix;
1362 req->fh = newSVsv (oldpath); 1445 req->fh = newSVsv (oldpath);
1363 req->data2ptr = SvPVbyte_nolen (req->fh); 1446 req->data2ptr = SvPVbyte_nolen (req->fh);
1364 req->data = newSVsv (newpath); 1447 req->data = newSVsv (newpath);
1365 req->dataptr = SvPVbyte_nolen (req->data); 1448 req->dataptr = SvPVbyte_nolen (req->data);
1449
1450 REQ_SEND;
1451}
1452
1453void
1454aio_mknod (pathname,mode,dev,callback=&PL_sv_undef)
1455 SV * pathname
1456 SV * callback
1457 UV mode
1458 UV dev
1459 PPCODE:
1460{
1461 dREQ;
1462
1463 req->type = REQ_MKNOD;
1464 req->data = newSVsv (pathname);
1465 req->dataptr = SvPVbyte_nolen (req->data);
1466 req->mode = (mode_t)mode;
1467 req->offset = dev;
1366 1468
1367 REQ_SEND; 1469 REQ_SEND;
1368} 1470}
1369 1471
1370void 1472void
1491 1593
1492int 1594int
1493nready() 1595nready()
1494 PROTOTYPE: 1596 PROTOTYPE:
1495 CODE: 1597 CODE:
1496 if (WORDREAD_UNSAFE) LOCK (reqlock);
1497 RETVAL = nready; 1598 RETVAL = get_nready ();
1498 if (WORDREAD_UNSAFE) UNLOCK (reqlock);
1499 OUTPUT: 1599 OUTPUT:
1500 RETVAL 1600 RETVAL
1501 1601
1502int 1602int
1503npending() 1603npending()
1504 PROTOTYPE: 1604 PROTOTYPE:
1505 CODE: 1605 CODE:
1506 if (WORDREAD_UNSAFE) LOCK (reslock);
1507 RETVAL = npending; 1606 RETVAL = get_npending ();
1508 if (WORDREAD_UNSAFE) UNLOCK (reslock);
1509 OUTPUT: 1607 OUTPUT:
1510 RETVAL 1608 RETVAL
1511 1609
1512PROTOTYPES: DISABLE 1610PROTOTYPES: DISABLE
1513 1611

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines