ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/IO-AIO/AIO.xs
Revision: 1.73
Committed: Tue Oct 24 21:26:30 2006 UTC (17 years, 6 months ago) by root
Branch: MAIN
Changes since 1.72: +3 -3 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 /* solaris */
2 #define _POSIX_PTHREAD_SEMANTICS 1
3
4 #if __linux
5 # define _GNU_SOURCE
6 #endif
7
8 #define _REENTRANT 1
9
10 #include <errno.h>
11
12 #include "EXTERN.h"
13 #include "perl.h"
14 #include "XSUB.h"
15
16 #include "autoconf/config.h"
17
18 #include <pthread.h>
19
20 #include <stddef.h>
21 #include <errno.h>
22 #include <sys/time.h>
23 #include <sys/select.h>
24 #include <sys/types.h>
25 #include <sys/stat.h>
26 #include <limits.h>
27 #include <unistd.h>
28 #include <fcntl.h>
29 #include <signal.h>
30 #include <sched.h>
31
32 #if HAVE_SENDFILE
33 # if __linux
34 # include <sys/sendfile.h>
35 # elif __freebsd
36 # include <sys/socket.h>
37 # include <sys/uio.h>
38 # elif __hpux
39 # include <sys/socket.h>
40 # elif __solaris /* not yet */
41 # include <sys/sendfile.h>
42 # else
43 # error sendfile support requested but not available
44 # endif
45 #endif
46
47 /* used for struct dirent, AIX doesn't provide it */
48 #ifndef NAME_MAX
49 # define NAME_MAX 4096
50 #endif
51
52 #if __ia64
53 # define STACKSIZE 65536
54 #elif __i386 || __x86_64 /* 16k is unreasonably high :( */
55 # define STACKSIZE PTHREAD_STACK_MIN
56 #else
57 # define STACKSIZE 16384
58 #endif
59
60 /* buffer size for various temporary buffers */
61 #define AIO_BUFSIZE 65536
62
/*
 * dBUF: declare "aio_buf", a scratch buffer of AIO_BUFSIZE bytes.
 * Needs a "worker *self" in scope: the buffer is also stored in
 * self->dbuf (while holding wrklock) so worker_clear () can free it.
 * Makes the enclosing function return -1 if the allocation fails.
 */
#define dBUF                            \
  char *aio_buf;                        \
                                        \
  LOCK (wrklock);                       \
  aio_buf = malloc (AIO_BUFSIZE);       \
  self->dbuf = aio_buf;                 \
  UNLOCK (wrklock);                     \
                                        \
  if (aio_buf == 0)                     \
    return -1;
70
/* request types, stored in aio_cb.type and dispatched on in aio_proc () */
enum
{
  REQ_QUIT,       /* makes the worker thread that picks it up terminate */
  REQ_OPEN,
  REQ_CLOSE,
  REQ_READ,
  REQ_WRITE,
  REQ_READAHEAD,
  REQ_SENDFILE,
  REQ_STAT,
  REQ_LSTAT,
  REQ_FSTAT,
  REQ_FSYNC,
  REQ_FDATASYNC,
  REQ_UNLINK,
  REQ_RMDIR,
  REQ_RENAME,
  REQ_READDIR,
  REQ_LINK,
  REQ_SYMLINK,
  REQ_GROUP,      /* container for other requests, no I/O of its own */
  REQ_NOP,        /* does nothing in the worker */
  REQ_BUSY,       /* worker sleeps in select () for the requested time */
};
84
85 #define AIO_REQ_KLASS "IO::AIO::REQ"
86 #define AIO_GRP_KLASS "IO::AIO::GRP"
87
88 typedef struct aio_cb
89 {
90 struct aio_cb *volatile next;
91
92 SV *data, *callback;
93 SV *fh, *fh2;
94 void *dataptr, *data2ptr;
95 Stat_t *statdata;
96 off_t offset;
97 size_t length;
98 ssize_t result;
99
100 STRLEN dataoffset;
101 int type;
102 int fd, fd2;
103 int errorno;
104 mode_t mode; /* open */
105
106 unsigned char flags;
107 unsigned char pri;
108
109 SV *self; /* the perl counterpart of this request, if any */
110 struct aio_cb *grp, *grp_prev, *grp_next, *grp_first;
111 } aio_cb;
112
113 enum {
114 FLAG_CANCELLED = 0x01,
115 };
116
117 typedef aio_cb *aio_req;
118 typedef aio_cb *aio_req_ornot;
119
/*
 * Request priorities. User-visible values run from PRI_MIN to PRI_MAX;
 * internally PRI_BIAS is added so they can index arrays of NUM_PRI slots.
 */
enum
{
  PRI_MIN     = -4,
  PRI_MAX     = 4,

  DEFAULT_PRI = 0,
  PRI_BIAS    = -PRI_MIN,
  NUM_PRI     = PRI_MAX + PRI_BIAS + 1,
};
128
129 static int next_pri = DEFAULT_PRI + PRI_BIAS;
130
131 static int started, wanted;
132 static volatile int nreqs;
133 static int max_outstanding = 1<<30;
134 static int respipe [2];
135
/* static mutex initialiser: use the adaptive flavour where linux offers it */
#if defined (PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP) && __linux
# define AIO_MUTEX_INIT PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP
#else
# define AIO_MUTEX_INIT PTHREAD_MUTEX_INITIALIZER
#endif

/* both take the mutex object itself, not a pointer to it */
#define LOCK(mutex)   pthread_mutex_lock   (&(mutex))
#define UNLOCK(mutex) pthread_mutex_unlock (&(mutex))
144
145 /* worker thread management */
146 static pthread_mutex_t wrklock = AIO_MUTEX_INIT;
147
148 typedef struct worker {
149 /* locked by wrklock */
150 struct worker *prev, *next;
151
152 pthread_t tid;
153
154 /* locked by reslock, reqlock or wrklock */
155 aio_req req; /* currently processed request */
156 void *dbuf;
157 DIR *dirp;
158 } worker;
159
160 static worker wrk_first = { &wrk_first, &wrk_first, 0 };
161
162 static void worker_clear (worker *wrk)
163 {
164 if (wrk->dirp)
165 {
166 closedir (wrk->dirp);
167 wrk->dirp = 0;
168 }
169
170 if (wrk->dbuf)
171 {
172 free (wrk->dbuf);
173 wrk->dbuf = 0;
174 }
175 }
176
177 static void worker_free (worker *wrk)
178 {
179 wrk->next->prev = wrk->prev;
180 wrk->prev->next = wrk->next;
181
182 free (wrk);
183 }
184
185 static pthread_mutex_t reslock = AIO_MUTEX_INIT;
186 static pthread_mutex_t reqlock = AIO_MUTEX_INIT;
187 static pthread_cond_t reqwait = PTHREAD_COND_INITIALIZER;
188
189 /*
190 * a somewhat faster data structure might be nice, but
191 * with 8 priorities this actually needs <20 insns
192 * per shift, the most expensive operation.
193 */
194 typedef struct {
195 aio_req qs[NUM_PRI], qe[NUM_PRI]; /* qstart, qend */
196 int size;
197 } reqq;
198
199 static reqq req_queue;
200 static reqq res_queue;
201
202 int reqq_push (reqq *q, aio_req req)
203 {
204 int pri = req->pri;
205 req->next = 0;
206
207 if (q->qe[pri])
208 {
209 q->qe[pri]->next = req;
210 q->qe[pri] = req;
211 }
212 else
213 q->qe[pri] = q->qs[pri] = req;
214
215 return q->size++;
216 }
217
218 aio_req reqq_shift (reqq *q)
219 {
220 int pri;
221
222 if (!q->size)
223 return 0;
224
225 --q->size;
226
227 for (pri = NUM_PRI; pri--; )
228 {
229 aio_req req = q->qs[pri];
230
231 if (req)
232 {
233 if (!(q->qs[pri] = req->next))
234 q->qe[pri] = 0;
235
236 return req;
237 }
238 }
239
240 abort ();
241 }
242
243 static void req_invoke (aio_req req);
244 static void req_free (aio_req req);
245 static void req_cancel (aio_req req);
246
247 /* must be called at most once */
248 static SV *req_sv (aio_req req, const char *klass)
249 {
250 if (!req->self)
251 {
252 req->self = (SV *)newHV ();
253 sv_magic (req->self, 0, PERL_MAGIC_ext, (char *)req, 0);
254 }
255
256 return sv_2mortal (sv_bless (newRV_inc (req->self), gv_stashpv (klass, 1)));
257 }
258
259 static aio_req SvAIO_REQ (SV *sv)
260 {
261 MAGIC *mg;
262
263 if (!sv_derived_from (sv, AIO_REQ_KLASS) || !SvROK (sv))
264 croak ("object of class " AIO_REQ_KLASS " expected");
265
266 mg = mg_find (SvRV (sv), PERL_MAGIC_ext);
267
268 return mg ? (aio_req)mg->mg_ptr : 0;
269 }
270
271 static void aio_grp_feed (aio_req grp)
272 {
273 while (grp->length < grp->fd2 && !(grp->flags & FLAG_CANCELLED))
274 {
275 int old_len = grp->length;
276
277 if (grp->fh2 && SvOK (grp->fh2))
278 {
279 dSP;
280
281 ENTER;
282 SAVETMPS;
283 PUSHMARK (SP);
284 XPUSHs (req_sv (grp, AIO_GRP_KLASS));
285 PUTBACK;
286 call_sv (grp->fh2, G_VOID | G_EVAL | G_KEEPERR);
287 SPAGAIN;
288 FREETMPS;
289 LEAVE;
290 }
291
292 /* stop if no progress has been made */
293 if (old_len == grp->length)
294 {
295 SvREFCNT_dec (grp->fh2);
296 grp->fh2 = 0;
297 break;
298 }
299 }
300 }
301
302 static void aio_grp_dec (aio_req grp)
303 {
304 --grp->length;
305
306 /* call feeder, if applicable */
307 aio_grp_feed (grp);
308
309 /* finish, if done */
310 if (!grp->length && grp->fd)
311 {
312 req_invoke (grp);
313 req_free (grp);
314 }
315 }
316
317 static void poll_wait ()
318 {
319 fd_set rfd;
320
321 while (nreqs)
322 {
323 int size;
324 #if !(__i386 || __x86_64) /* safe without sempahore on these archs */
325 LOCK (reslock);
326 #endif
327 size = res_queue.size;
328 #if !(__i386 || __x86_64) /* safe without sempahore on these archs */
329 UNLOCK (reslock);
330 #endif
331
332 if (size)
333 return;
334
335 FD_ZERO(&rfd);
336 FD_SET(respipe [0], &rfd);
337
338 select (respipe [0] + 1, &rfd, 0, 0, 0);
339 }
340 }
341
342 static void req_invoke (aio_req req)
343 {
344 dSP;
345
346 if (!(req->flags & FLAG_CANCELLED) && SvOK (req->callback))
347 {
348 errno = req->errorno;
349
350 ENTER;
351 SAVETMPS;
352 PUSHMARK (SP);
353 EXTEND (SP, 1);
354
355 switch (req->type)
356 {
357 case REQ_READDIR:
358 {
359 SV *rv = &PL_sv_undef;
360
361 if (req->result >= 0)
362 {
363 int i;
364 char *buf = req->data2ptr;
365 AV *av = newAV ();
366
367 av_extend (av, req->result - 1);
368
369 for (i = 0; i < req->result; ++i)
370 {
371 SV *sv = newSVpv (buf, 0);
372
373 av_store (av, i, sv);
374 buf += SvCUR (sv) + 1;
375 }
376
377 rv = sv_2mortal (newRV_noinc ((SV *)av));
378 }
379
380 PUSHs (rv);
381 }
382 break;
383
384 case REQ_OPEN:
385 {
386 /* convert fd to fh */
387 SV *fh;
388
389 PUSHs (sv_2mortal (newSViv (req->result)));
390 PUTBACK;
391 call_pv ("IO::AIO::_fd2fh", G_SCALAR | G_EVAL);
392 SPAGAIN;
393
394 fh = SvREFCNT_inc (POPs);
395
396 PUSHMARK (SP);
397 XPUSHs (sv_2mortal (fh));
398 }
399 break;
400
401 case REQ_GROUP:
402 req->fd = 2; /* mark group as finished */
403
404 if (req->data)
405 {
406 int i;
407 AV *av = (AV *)req->data;
408
409 EXTEND (SP, AvFILL (av) + 1);
410 for (i = 0; i <= AvFILL (av); ++i)
411 PUSHs (*av_fetch (av, i, 0));
412 }
413 break;
414
415 case REQ_NOP:
416 case REQ_BUSY:
417 break;
418
419 default:
420 PUSHs (sv_2mortal (newSViv (req->result)));
421 break;
422 }
423
424
425 PUTBACK;
426 call_sv (req->callback, G_VOID | G_EVAL);
427 SPAGAIN;
428
429 FREETMPS;
430 LEAVE;
431 }
432
433 if (req->grp)
434 {
435 aio_req grp = req->grp;
436
437 /* unlink request */
438 if (req->grp_next) req->grp_next->grp_prev = req->grp_prev;
439 if (req->grp_prev) req->grp_prev->grp_next = req->grp_next;
440
441 if (grp->grp_first == req)
442 grp->grp_first = req->grp_next;
443
444 aio_grp_dec (grp);
445 }
446
447 if (SvTRUE (ERRSV))
448 {
449 req_free (req);
450 croak (0);
451 }
452 }
453
454 static void req_free (aio_req req)
455 {
456 if (req->self)
457 {
458 sv_unmagic (req->self, PERL_MAGIC_ext);
459 SvREFCNT_dec (req->self);
460 }
461
462 SvREFCNT_dec (req->data);
463 SvREFCNT_dec (req->fh);
464 SvREFCNT_dec (req->fh2);
465 SvREFCNT_dec (req->callback);
466 Safefree (req->statdata);
467
468 if (req->type == REQ_READDIR)
469 free (req->data2ptr);
470
471 Safefree (req);
472 }
473
474 static void req_cancel_subs (aio_req grp)
475 {
476 aio_req sub;
477
478 if (grp->type != REQ_GROUP)
479 return;
480
481 SvREFCNT_dec (grp->fh2);
482 grp->fh2 = 0;
483
484 for (sub = grp->grp_first; sub; sub = sub->grp_next)
485 req_cancel (sub);
486 }
487
488 static void req_cancel (aio_req req)
489 {
490 req->flags |= FLAG_CANCELLED;
491
492 req_cancel_subs (req);
493 }
494
495 static int poll_cb ()
496 {
497 dSP;
498 int count = 0;
499 int do_croak = 0;
500 aio_req req;
501
502 for (;;)
503 {
504 LOCK (reslock);
505 req = reqq_shift (&res_queue);
506
507 if (req)
508 {
509 if (!res_queue.size)
510 {
511 /* read any signals sent by the worker threads */
512 char buf [32];
513 while (read (respipe [0], buf, 32) == 32)
514 ;
515 }
516 }
517
518 UNLOCK (reslock);
519
520 if (!req)
521 break;
522
523 --nreqs;
524
525 if (req->type == REQ_QUIT)
526 started--;
527 else if (req->type == REQ_GROUP && req->length)
528 {
529 req->fd = 1; /* mark request as delayed */
530 continue;
531 }
532 else
533 {
534 if (req->type == REQ_READ)
535 SvCUR_set (req->data, req->dataoffset + (req->result > 0 ? req->result : 0));
536
537 if (req->data2ptr && (req->type == REQ_READ || req->type == REQ_WRITE))
538 SvREADONLY_off (req->data);
539
540 if (req->statdata)
541 {
542 PL_laststype = req->type == REQ_LSTAT ? OP_LSTAT : OP_STAT;
543 PL_laststatval = req->result;
544 PL_statcache = *(req->statdata);
545 }
546
547 req_invoke (req);
548
549 count++;
550 }
551
552 req_free (req);
553 }
554
555 return count;
556 }
557
558 static void *aio_proc(void *arg);
559
560 static void start_thread (void)
561 {
562 sigset_t fullsigset, oldsigset;
563 pthread_attr_t attr;
564
565 worker *wrk = calloc (1, sizeof (worker));
566
567 if (!wrk)
568 croak ("unable to allocate worker thread data");
569
570 pthread_attr_init (&attr);
571 pthread_attr_setstacksize (&attr, STACKSIZE);
572 pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
573
574 sigfillset (&fullsigset);
575
576 LOCK (wrklock);
577 sigprocmask (SIG_SETMASK, &fullsigset, &oldsigset);
578
579 if (pthread_create (&wrk->tid, &attr, aio_proc, (void *)wrk) == 0)
580 {
581 wrk->prev = &wrk_first;
582 wrk->next = wrk_first.next;
583 wrk_first.next->prev = wrk;
584 wrk_first.next = wrk;
585 started++;
586 }
587 else
588 free (wrk);
589
590 sigprocmask (SIG_SETMASK, &oldsigset, 0);
591 UNLOCK (wrklock);
592 }
593
594 static void req_send (aio_req req)
595 {
596 while (started < wanted && nreqs >= started)
597 start_thread ();
598
599 ++nreqs;
600
601 LOCK (reqlock);
602 reqq_push (&req_queue, req);
603 pthread_cond_signal (&reqwait);
604 UNLOCK (reqlock);
605
606 if (nreqs > max_outstanding)
607 for (;;)
608 {
609 poll_cb ();
610
611 if (nreqs <= max_outstanding)
612 break;
613
614 poll_wait ();
615 }
616 }
617
618 static void end_thread (void)
619 {
620 aio_req req;
621
622 Newz (0, req, 1, aio_cb);
623
624 req->type = REQ_QUIT;
625 req->pri = PRI_MAX + PRI_BIAS;
626
627 req_send (req);
628 }
629
630 static void min_parallel (int nthreads)
631 {
632 if (wanted < nthreads)
633 wanted = nthreads;
634 }
635
636 static void max_parallel (int nthreads)
637 {
638 int cur = started;
639
640 if (wanted > nthreads)
641 wanted = nthreads;
642
643 while (cur > wanted)
644 {
645 end_thread ();
646 cur--;
647 }
648
649 while (started > wanted)
650 {
651 poll_wait ();
652 poll_cb ();
653 }
654 }
655
656 static void create_pipe ()
657 {
658 if (pipe (respipe))
659 croak ("unable to initialize result pipe");
660
661 if (fcntl (respipe [0], F_SETFL, O_NONBLOCK))
662 croak ("cannot set result pipe to nonblocking mode");
663
664 if (fcntl (respipe [1], F_SETFL, O_NONBLOCK))
665 croak ("cannot set result pipe to nonblocking mode");
666 }
667
668 /*****************************************************************************/
669 /* work around various missing functions */
670
#if !HAVE_PREADWRITE
# define pread  aio_pread
# define pwrite aio_pwrite

/*
 * make our pread/pwrite safe against themselves, but not against
 * normal read/write by using a mutex. slows down execution a lot,
 * but that's your problem, not mine.
 */
static pthread_mutex_t preadwritelock = PTHREAD_MUTEX_INITIALIZER;

/*
 * Emulated pread: read count bytes at offset, then put the file
 * position back where it was. Returns what read () returned.
 */
static ssize_t pread (int fd, void *buf, size_t count, off_t offset)
{
  ssize_t res;
  off_t ooffset;

  LOCK (preadwritelock);
  ooffset = lseek (fd, 0, SEEK_CUR);
  lseek (fd, offset, SEEK_SET);
  res = read (fd, buf, count);
  lseek (fd, ooffset, SEEK_SET);
  UNLOCK (preadwritelock);

  return res;
}

/*
 * Emulated pwrite: write count bytes at offset, then put the file
 * position back where it was. Returns what write () returned.
 */
static ssize_t pwrite (int fd, void *buf, size_t count, off_t offset)
{
  ssize_t res;
  off_t ooffset;

  LOCK (preadwritelock);
  ooffset = lseek (fd, 0, SEEK_CUR);
  lseek (fd, offset, SEEK_SET);
  res = write (fd, buf, count);
  /* restore the saved position, not the write offset */
  lseek (fd, ooffset, SEEK_SET);
  UNLOCK (preadwritelock);

  return res;
}
#endif
712
713 #if !HAVE_FDATASYNC
714 # define fdatasync fsync
715 #endif
716
717 #if !HAVE_READAHEAD
718 # define readahead aio_readahead
719
720 static ssize_t readahead (int fd, off_t offset, size_t count)
721 {
722 dBUF;
723
724 while (count > 0)
725 {
726 size_t len = count < AIO_BUFSIZE ? count : AIO_BUFSIZE;
727
728 pread (fd, aio_buf, len, offset);
729 offset += len;
730 count -= len;
731 }
732
733 errno = 0;
734 }
735 #endif
736
#if !HAVE_READDIR_R
# define readdir_r aio_readdir_r

static pthread_mutex_t readdirlock = PTHREAD_MUTEX_INITIALIZER;

/*
 * Emulated readdir_r: serialise readdir () with a mutex and copy the
 * entry name into the caller's buffer. *res is set to ent when an entry
 * was read and to 0 otherwise; errno is left as readdir () set it.
 * Returns 0 when an entry was read, -1 otherwise.
 */
static int readdir_r (DIR *dirp, struct dirent *ent, struct dirent **res)
{
  struct dirent *found;
  int saved_errno;
  int status;

  LOCK (readdirlock);

  found = readdir (dirp);
  saved_errno = errno;

  if (!found)
    {
      *res = 0;
      status = -1;
    }
  else
    {
      *res = ent;
      strcpy (ent->d_name, found->d_name);
      status = 0;
    }

  UNLOCK (readdirlock);

  errno = saved_errno;
  return status;
}
#endif
766
767 /* sendfile always needs emulation */
768 static ssize_t sendfile_ (int ofd, int ifd, off_t offset, size_t count, worker *self)
769 {
770 ssize_t res;
771
772 if (!count)
773 return 0;
774
775 #if HAVE_SENDFILE
776 # if __linux
777 res = sendfile (ofd, ifd, &offset, count);
778
779 # elif __freebsd
780 /*
781 * Of course, the freebsd sendfile is a dire hack with no thoughts
782 * wasted on making it similar to other I/O functions.
783 */
784 {
785 off_t sbytes;
786 res = sendfile (ifd, ofd, offset, count, 0, &sbytes, 0);
787
788 if (res < 0 && sbytes)
789 /* maybe only on EAGAIN only: as usual, the manpage leaves you guessing */
790 res = sbytes;
791 }
792
793 # elif __hpux
794 res = sendfile (ofd, ifd, offset, count, 0, 0);
795
796 # elif __solaris
797 {
798 struct sendfilevec vec;
799 size_t sbytes;
800
801 vec.sfv_fd = ifd;
802 vec.sfv_flag = 0;
803 vec.sfv_off = offset;
804 vec.sfv_len = count;
805
806 res = sendfilev (ofd, &vec, 1, &sbytes);
807
808 if (res < 0 && sbytes)
809 res = sbytes;
810 }
811
812 # endif
813 #else
814 res = -1;
815 errno = ENOSYS;
816 #endif
817
818 if (res < 0
819 && (errno == ENOSYS || errno == EINVAL || errno == ENOTSOCK
820 #if __solaris
821 || errno == EAFNOSUPPORT || errno == EPROTOTYPE
822 #endif
823 )
824 )
825 {
826 /* emulate sendfile. this is a major pain in the ass */
827 dBUF;
828
829 res = 0;
830
831 while (count)
832 {
833 ssize_t cnt;
834
835 cnt = pread (ifd, aio_buf, count > AIO_BUFSIZE ? AIO_BUFSIZE : count, offset);
836
837 if (cnt <= 0)
838 {
839 if (cnt && !res) res = -1;
840 break;
841 }
842
843 cnt = write (ofd, aio_buf, cnt);
844
845 if (cnt <= 0)
846 {
847 if (cnt && !res) res = -1;
848 break;
849 }
850
851 offset += cnt;
852 res += cnt;
853 count -= cnt;
854 }
855 }
856
857 return res;
858 }
859
860 /* read a full directory */
861 static void scandir_ (aio_req req, worker *self)
862 {
863 DIR *dirp;
864 union
865 {
866 struct dirent d;
867 char b [offsetof (struct dirent, d_name) + NAME_MAX + 1];
868 } *u;
869 struct dirent *entp;
870 char *name, *names;
871 int memlen = 4096;
872 int memofs = 0;
873 int res = 0;
874 int errorno;
875
876 LOCK (wrklock);
877 self->dirp = dirp = opendir (req->dataptr);
878 self->dbuf = u = malloc (sizeof (*u));
879 UNLOCK (wrklock);
880
881 req->data2ptr = names = malloc (memlen);
882
883 if (dirp && u && names)
884 for (;;)
885 {
886 errno = 0;
887 readdir_r (dirp, &u->d, &entp);
888
889 if (!entp)
890 break;
891
892 name = entp->d_name;
893
894 if (name [0] != '.' || (name [1] && (name [1] != '.' || name [2])))
895 {
896 int len = strlen (name) + 1;
897
898 res++;
899
900 while (memofs + len > memlen)
901 {
902 memlen *= 2;
903 LOCK (wrklock);
904 req->data2ptr = names = realloc (names, memlen);
905 UNLOCK (wrklock);
906
907 if (!names)
908 break;
909 }
910
911 memcpy (names + memofs, name, len);
912 memofs += len;
913 }
914 }
915
916 if (errno)
917 res = -1;
918
919 req->result = res;
920 }
921
922 /*****************************************************************************/
923
924 static void *aio_proc (void *thr_arg)
925 {
926 aio_req req;
927 int type;
928 worker *self = (worker *)thr_arg;
929
930 do
931 {
932 LOCK (reqlock);
933
934 for (;;)
935 {
936 self->req = req = reqq_shift (&req_queue);
937
938 if (req)
939 break;
940
941 pthread_cond_wait (&reqwait, &reqlock);
942 }
943
944 UNLOCK (reqlock);
945
946 errno = 0; /* strictly unnecessary */
947 type = req->type; /* remember type for QUIT check */
948
949 if (!(req->flags & FLAG_CANCELLED))
950 switch (type)
951 {
952 case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break;
953 case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break;
954
955 case REQ_READAHEAD: req->result = readahead (req->fd, req->offset, req->length); break;
956 case REQ_SENDFILE: req->result = sendfile_ (req->fd, req->fd2, req->offset, req->length, self); break;
957
958 case REQ_STAT: req->result = stat (req->dataptr, req->statdata); break;
959 case REQ_LSTAT: req->result = lstat (req->dataptr, req->statdata); break;
960 case REQ_FSTAT: req->result = fstat (req->fd , req->statdata); break;
961
962 case REQ_OPEN: req->result = open (req->dataptr, req->fd, req->mode); break;
963 case REQ_CLOSE: req->result = close (req->fd); break;
964 case REQ_UNLINK: req->result = unlink (req->dataptr); break;
965 case REQ_RMDIR: req->result = rmdir (req->dataptr); break;
966 case REQ_RENAME: req->result = rename (req->data2ptr, req->dataptr); break;
967 case REQ_LINK: req->result = link (req->data2ptr, req->dataptr); break;
968 case REQ_SYMLINK: req->result = symlink (req->data2ptr, req->dataptr); break;
969
970 case REQ_FDATASYNC: req->result = fdatasync (req->fd); break;
971 case REQ_FSYNC: req->result = fsync (req->fd); break;
972 case REQ_READDIR: scandir_ (req, self); break;
973
974 case REQ_BUSY:
975 {
976 struct timeval tv;
977
978 tv.tv_sec = req->fd;
979 tv.tv_usec = req->fd2;
980
981 req->result = select (0, 0, 0, 0, &tv);
982 }
983
984 case REQ_GROUP:
985 case REQ_NOP:
986 case REQ_QUIT:
987 break;
988
989 default:
990 req->result = ENOSYS;
991 break;
992 }
993
994 req->errorno = errno;
995
996 LOCK (reslock);
997
998 if (!reqq_push (&res_queue, req))
999 /* write a dummy byte to the pipe so fh becomes ready */
1000 write (respipe [1], &respipe, 1);
1001
1002 self->req = 0;
1003 worker_clear (self);
1004
1005 UNLOCK (reslock);
1006 }
1007 while (type != REQ_QUIT);
1008
1009 LOCK (wrklock);
1010 worker_free (self);
1011 UNLOCK (wrklock);
1012
1013 return 0;
1014 }
1015
1016 /*****************************************************************************/
1017
1018 static void atfork_prepare (void)
1019 {
1020 LOCK (wrklock);
1021 LOCK (reqlock);
1022 LOCK (reslock);
1023 #if !HAVE_PREADWRITE
1024 LOCK (preadwritelock);
1025 #endif
1026 #if !HAVE_READDIR_R
1027 LOCK (readdirlock);
1028 #endif
1029 }
1030
1031 static void atfork_parent (void)
1032 {
1033 #if !HAVE_READDIR_R
1034 UNLOCK (readdirlock);
1035 #endif
1036 #if !HAVE_PREADWRITE
1037 UNLOCK (preadwritelock);
1038 #endif
1039 UNLOCK (reslock);
1040 UNLOCK (reqlock);
1041 UNLOCK (wrklock);
1042 }
1043
1044 static void atfork_child (void)
1045 {
1046 aio_req prv;
1047
1048 while (prv = reqq_shift (&req_queue))
1049 req_free (prv);
1050
1051 while (prv = reqq_shift (&res_queue))
1052 req_free (prv);
1053
1054 while (wrk_first.next != &wrk_first)
1055 {
1056 worker *wrk = wrk_first.next;
1057
1058 if (wrk->req)
1059 req_free (wrk->req);
1060
1061 worker_clear (wrk);
1062 worker_free (wrk);
1063 }
1064
1065 started = 0;
1066 nreqs = 0;
1067
1068 close (respipe [0]);
1069 close (respipe [1]);
1070 create_pipe ();
1071
1072 atfork_parent ();
1073 }
1074
/*
 * dREQ: declare and allocate a zeroed request "req" for an XS function
 * that has an SV *callback in scope. Consumes next_pri (resetting it to
 * the default) and croaks if callback is defined but not a reference.
 */
#define dREQ                                                    \
  aio_req req;                                                  \
  int req_pri = next_pri;                                       \
                                                                \
  next_pri = DEFAULT_PRI + PRI_BIAS;                            \
                                                                \
  if (SvOK (callback) && !SvROK (callback))                     \
    croak ("callback must be undef or of reference type");      \
                                                                \
  Newz (0, req, 1, aio_cb);                                     \
                                                                \
  if (!req)                                                     \
    croak ("out of memory during aio_req allocation");          \
                                                                \
  req->callback = newSVsv (callback);                           \
  req->pri      = req_pri
1089
/*
 * REQ_SEND: submit "req" and, unless the XS function was called in void
 * context, push the request's perl object onto the stack. Takes no arguments.
 */
#define REQ_SEND                                \
  req_send (req);                               \
                                                \
  if (GIMME_V != G_VOID)                        \
    XPUSHs (req_sv (req, AIO_REQ_KLASS));
1095
1096 MODULE = IO::AIO PACKAGE = IO::AIO
1097
1098 PROTOTYPES: ENABLE
1099
BOOT:
{
        /* export a few constants into the IO::AIO package */
        HV *aio_stash = gv_stashpv ("IO::AIO", 1);

        newCONSTSUB (aio_stash, "EXDEV",    newSViv (EXDEV));
        newCONSTSUB (aio_stash, "O_RDONLY", newSViv (O_RDONLY));
        newCONSTSUB (aio_stash, "O_WRONLY", newSViv (O_WRONLY));

        /* result notification pipe and fork handlers */
        create_pipe ();
        pthread_atfork (atfork_prepare, atfork_parent, atfork_child);
}
1110
# raise the number of wanted worker threads to at least nthreads
void
min_parallel (int nthreads)
        PROTOTYPE: $
1115
# lower the number of worker threads to at most nthreads
void
max_parallel (int nthreads)
        PROTOTYPE: $
1120
# set the limit of outstanding requests and return the previous limit
int
max_outstanding (nreqs)
        int     nreqs
        PROTOTYPE: $
        CODE:
        RETVAL = max_outstanding;
        max_outstanding = nreqs;
        OUTPUT:
        RETVAL
1128
# queue an open request; the path is copied so the caller may reuse its scalar
void
aio_open (SV *pathname, int flags, int mode, SV *callback = &PL_sv_undef)
        PROTOTYPE: $$$;$
        PPCODE:
{
        dREQ;

        req->type    = REQ_OPEN;
        req->data    = newSVsv (pathname);
        req->dataptr = SvPVbyte_nolen (req->data);
        req->fd      = flags; /* open flags travel in the fd member */
        req->mode    = mode;

        REQ_SEND;
}
1148
# queue a close, fsync or fdatasync request (selected by the alias) for fh
void
aio_close (fh,callback=&PL_sv_undef)
        SV *    fh
        SV *    callback
        PROTOTYPE: $;$
        ALIAS:
           aio_close     = REQ_CLOSE
           aio_fsync     = REQ_FSYNC
           aio_fdatasync = REQ_FDATASYNC
        PPCODE:
{
        dREQ;

        req->type = ix;
        req->fh   = newSVsv (fh); /* keeps the handle alive while the request runs */
        req->fd   = PerlIO_fileno (IoIFP (sv_2io (fh)));

        /* REQ_SEND takes no arguments */
        REQ_SEND;
}
1168
# queue a read or write request (selected by the alias) on fh.
# dataoffset may be negative to count from the end of data; for writes a
# negative or too large length means "up to the end of data".
# length and dataoffset are signed so these checks can actually trigger.
void
aio_read (fh,offset,length,data,dataoffset,callback=&PL_sv_undef)
        SV *    fh
        UV      offset
        IV      length
        SV *    data
        IV      dataoffset
        SV *    callback
        ALIAS:
           aio_read  = REQ_READ
           aio_write = REQ_WRITE
        PROTOTYPE: $$$$$;$
        PPCODE:
{
        STRLEN svlen;
        char *svptr = SvPVbyte (data, svlen);

        SvUPGRADE (data, SVt_PV);
        SvPOK_on (data);

        if (dataoffset < 0)
          dataoffset += (IV)svlen;

        if (dataoffset < 0 || (STRLEN)dataoffset > svlen)
          croak ("data offset outside of string");

        if (ix == REQ_WRITE)
          {
            /* write: check length and adjust. */
            if (length < 0 || (STRLEN)length > svlen - (STRLEN)dataoffset)
              length = svlen - dataoffset;
          }
        else
          {
            if (length < 0)
              croak ("length must not be negative");

            /* read: grow scalar as necessary */
            svptr = SvGROW (data, length + dataoffset);
          }

        {
          dREQ;

          req->type    = ix;
          req->fh      = newSVsv (fh);
          req->fd      = PerlIO_fileno (ix == REQ_READ ? IoIFP (sv_2io (fh))
                                                       : IoOFP (sv_2io (fh)));
          req->offset  = offset;
          req->length  = length;
          req->data    = SvREFCNT_inc (data);
          req->dataptr = (char *)svptr + dataoffset;

          /* make the buffer readonly while in use; data2ptr tells poll_cb to undo it */
          if (!SvREADONLY (data))
            {
              SvREADONLY_on (data);
              req->data2ptr = (void *)data;
            }

          REQ_SEND;
        }
}
1232
# queue a request copying length bytes from in_fh (at in_offset) to out_fh
void
aio_sendfile (SV *out_fh, SV *in_fh, UV in_offset, UV length, SV *callback = &PL_sv_undef)
        PROTOTYPE: $$$$;$
        PPCODE:
{
        dREQ;

        req->type   = REQ_SENDFILE;

        /* output side */
        req->fh     = newSVsv (out_fh);
        req->fd     = PerlIO_fileno (IoIFP (sv_2io (out_fh)));

        /* input side */
        req->fh2    = newSVsv (in_fh);
        req->fd2    = PerlIO_fileno (IoIFP (sv_2io (in_fh)));

        req->offset = in_offset;
        req->length = length;

        REQ_SEND;
}
1255
# queue a readahead request for length bytes of fh starting at offset
void
aio_readahead (SV *fh, UV offset, IV length, SV *callback = &PL_sv_undef)
        PROTOTYPE: $$$;$
        PPCODE:
{
        dREQ;

        req->type   = REQ_READAHEAD;
        req->fh     = newSVsv (fh);
        req->fd     = PerlIO_fileno (IoIFP (sv_2io (fh)));
        req->offset = offset;
        req->length = length;

        REQ_SEND;
}
1275
# queue a stat/lstat request for a path, or an fstat request when the
# argument is not a string
void
aio_stat (SV *fh_or_path, SV *callback = &PL_sv_undef)
        ALIAS:
           aio_stat  = REQ_STAT
           aio_lstat = REQ_LSTAT
        PPCODE:
{
        dREQ;

        New (0, req->statdata, 1, Stat_t);

        if (req->statdata == 0)
          {
            req_free (req);
            croak ("out of memory during aio_req->statdata allocation");
          }

        if (!SvPOK (fh_or_path))
          {
            /* not a string: treat it as a file handle */
            req->type = REQ_FSTAT;
            req->fh   = newSVsv (fh_or_path);
            req->fd   = PerlIO_fileno (IoIFP (sv_2io (fh_or_path)));
          }
        else
          {
            req->type    = ix;
            req->data    = newSVsv (fh_or_path);
            req->dataptr = SvPVbyte_nolen (req->data);
          }

        REQ_SEND;
}
1309
# queue an unlink, rmdir or readdir request (selected by the alias) for a path
void
aio_unlink (SV *pathname, SV *callback = &PL_sv_undef)
        ALIAS:
           aio_unlink  = REQ_UNLINK
           aio_rmdir   = REQ_RMDIR
           aio_readdir = REQ_READDIR
        PPCODE:
{
        dREQ;

        req->data    = newSVsv (pathname);
        req->dataptr = SvPVbyte_nolen (req->data);
        req->type    = ix;

        REQ_SEND;
}
1328
# queue a link, symlink or rename request (selected by the alias)
void
aio_link (SV *oldpath, SV *newpath, SV *callback = &PL_sv_undef)
        ALIAS:
           aio_link    = REQ_LINK
           aio_symlink = REQ_SYMLINK
           aio_rename  = REQ_RENAME
        PPCODE:
{
        dREQ;

        req->type     = ix;

        /* the old path is kept in the fh member, its bytes in data2ptr */
        req->fh       = newSVsv (oldpath);
        req->data2ptr = SvPVbyte_nolen (req->fh);

        /* the new path lives in data/dataptr */
        req->data     = newSVsv (newpath);
        req->dataptr  = SvPVbyte_nolen (req->data);

        REQ_SEND;
}
1350
# queue a request that keeps a worker busy (sleeping) for delay seconds;
# negative delays are treated as zero
void
aio_busy (delay,callback=&PL_sv_undef)
        double  delay
        SV *    callback
        PPCODE:
{
        dREQ;

        req->type = REQ_BUSY;

        /* fd holds whole seconds; fd2 the remainder in microseconds (used as tv_usec) */
        req->fd   = delay < 0. ? 0 : delay;
        req->fd2  = delay < 0. ? 0 : 1000000. * (delay - req->fd);

        REQ_SEND;
}
1365
# create and queue a group request; always returns the IO::AIO::GRP object
void
aio_group (SV *callback = &PL_sv_undef)
        PROTOTYPE: ;$
        PPCODE:
{
        dREQ;

        req->type = REQ_GROUP;

        req_send (req);
        XPUSHs (req_sv (req, AIO_GRP_KLASS));
}
1379
# queue a request that does nothing except pass through the queues
void
aio_nop (SV *callback = &PL_sv_undef)
        PPCODE:
{
        dREQ;

        req->type = REQ_NOP;

        REQ_SEND;
}
1391
# set the priority of the next request, clamped to PRI_MIN .. PRI_MAX
void
aioreq_pri (int pri = DEFAULT_PRI)
        CODE:
        if (pri < PRI_MIN)
          pri = PRI_MIN;

        if (pri > PRI_MAX)
          pri = PRI_MAX;

        next_pri = PRI_BIAS + pri;
1398
# lower the priority of the next request by nice (raise it if negative),
# clamped to PRI_MIN .. PRI_MAX
void
aioreq_nice (int nice = 0)
        CODE:
        /* next_pri is stored biased: remove the bias before adjusting */
        nice = (next_pri - PRI_BIAS) - nice;
        if (nice < PRI_MIN) nice = PRI_MIN;
        if (nice > PRI_MAX) nice = PRI_MAX;
        next_pri = nice + PRI_BIAS;
1406
# wait for and process results until no request is outstanding
void
flush ()
        PROTOTYPE:
        CODE:
        for (;;)
          {
            if (!nreqs)
              break;

            poll_wait ();
            poll_cb ();
          }
1416
# if requests are outstanding, wait for results once and process them
void
poll()
        PROTOTYPE:
        CODE:
        if (nreqs != 0)
          {
            poll_wait ();
            poll_cb ();
          }
1426
# return the read end of the result pipe, for use in select/poll loops
int
poll_fileno()
        PROTOTYPE:
        CODE:
        RETVAL = respipe [0];
        OUTPUT:
        RETVAL

# process all queued results, return how many requests were handled
int
poll_cb(...)
        PROTOTYPE:
        CODE:
        RETVAL = poll_cb ();
        OUTPUT:
        RETVAL

# block until a result is available, unless nothing is outstanding
void
poll_wait()
        PROTOTYPE:
        CODE:
        if (nreqs != 0)
          poll_wait ();

# return the number of outstanding requests
int
nreqs()
        PROTOTYPE:
        CODE:
        RETVAL = nreqs;
        OUTPUT:
        RETVAL
1457
1458 PROTOTYPES: DISABLE
1459
1460 MODULE = IO::AIO PACKAGE = IO::AIO::REQ
1461
# mark the request (and, for groups, its members) as cancelled
void
cancel (aio_req_ornot req)
        CODE:
{
        req_cancel (req);
}
1466
# replace the callback of a request with a copy of the given one
void
cb (aio_req_ornot req, SV *callback=&PL_sv_undef)
        CODE:
{
        SV *previous = req->callback;

        SvREFCNT_dec (previous);
        req->callback = newSVsv (callback);
}
1472
1473 MODULE = IO::AIO PACKAGE = IO::AIO::GRP
1474
# add the given requests to the group; outside void context copies of
# the arguments are returned. Croaks once the group has finished.
void
add (aio_req grp, ...)
        PPCODE:
{
        int idx = 1;
        aio_req member;

        if (grp->fd == 2)
          croak ("cannot add requests to IO::AIO::GRP after the group finished");

        while (idx < items)
          {
            if (GIMME_V != G_VOID)
              XPUSHs (sv_2mortal (newSVsv (ST (idx))));

            member = SvAIO_REQ (ST (idx));

            if (member)
              {
                aio_req old_head = grp->grp_first;

                ++grp->length;
                member->grp = grp;

                /* insert at the head of the group's member list */
                member->grp_prev = 0;
                member->grp_next = old_head;

                if (old_head)
                  old_head->grp_prev = member;

                grp->grp_first = member;
              }

            ++idx;
          }
}
1507
# cancel all members of a group request, leaving the group itself alone
void
cancel_subs (aio_req_ornot req)
        CODE:
{
        req_cancel_subs (req);
}
1512
# store copies of the given values as the arguments for the group's callback,
# replacing any previously stored list
void
result (aio_req grp, ...)
        CODE:
{
        AV *values = newAV ();
        int idx = 1;

        while (idx < items)
          {
            av_push (values, newSVsv (ST (idx)));
            ++idx;
          }

        SvREFCNT_dec (grp->data);
        grp->data = (SV *)values;
}
1526
# set how many members the feeder should keep in the group, then feed
void
limit (aio_req grp, int limit)
        CODE:
{
        grp->fd2 = limit;
        aio_grp_feed (grp);
}
1532
# install a feeder callback for the group and start feeding;
# a limit that is not positive is replaced by 2
void
feed (aio_req grp, SV *callback=&PL_sv_undef)
        CODE:
{
        SV *old_feeder = grp->fh2;

        SvREFCNT_dec (old_feeder);
        grp->fh2 = newSVsv (callback);

        if (!(grp->fd2 > 0))
          grp->fd2 = 2;

        aio_grp_feed (grp);
}
1545