ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/IO-AIO/AIO.xs
Revision: 1.82
Committed: Fri Oct 27 20:11:58 2006 UTC (17 years, 6 months ago) by root
Branch: MAIN
Changes since 1.81: +2 -0 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 /* solaris */
2 #define _POSIX_PTHREAD_SEMANTICS 1
3
4 #if __linux && !defined(_GNU_SOURCE)
5 # define _GNU_SOURCE
6 #endif
7
8 /* just in case */
9 #define _REENTRANT 1
10
11 #include <errno.h>
12
13 #include "EXTERN.h"
14 #include "perl.h"
15 #include "XSUB.h"
16
17 #include "autoconf/config.h"
18
19 #include <pthread.h>
20
21 #include <stddef.h>
22 #include <errno.h>
23 #include <sys/time.h>
24 #include <sys/select.h>
25 #include <sys/types.h>
26 #include <sys/stat.h>
27 #include <limits.h>
28 #include <unistd.h>
29 #include <fcntl.h>
30 #include <signal.h>
31 #include <sched.h>
32
33 #if HAVE_SENDFILE
34 # if __linux
35 # include <sys/sendfile.h>
36 # elif __freebsd
37 # include <sys/socket.h>
38 # include <sys/uio.h>
39 # elif __hpux
40 # include <sys/socket.h>
41 # elif __solaris /* not yet */
42 # include <sys/sendfile.h>
43 # else
44 # error sendfile support requested but not available
45 # endif
46 #endif
47
/* struct dirent buffers are sized with NAME_MAX; AIX doesn't provide it */
#if !defined (NAME_MAX)
# define NAME_MAX 4096
#endif

/* care for broken platforms, e.g. windows */
#if !defined (PTHREAD_STACK_MIN)
# define PTHREAD_STACK_MIN 16384
#endif

/* stack size requested for every worker thread */
#if __ia64
# define STACKSIZE 65536
#elif __i386 || __x86_64 /* 16k is unreasonably high :( */
# define STACKSIZE PTHREAD_STACK_MIN
#else
# define STACKSIZE 16384
#endif

/* whether word reads are potentially non-atomic.
 * this is conservative, most likely the arches this runs
 * on have atomic word reads/writes.
 */
#if !defined (WORDREAD_UNSAFE)
# if __i386 || __x86_64
#  define WORDREAD_UNSAFE 0
# else
#  define WORDREAD_UNSAFE 1
# endif
#endif

/* buffer size for various temporary buffers */
#define AIO_BUFSIZE 65536
80
/*
 * dBUF declares a scratch buffer "aio_buf" of AIO_BUFSIZE bytes inside a
 * worker-side helper.  It expects a "worker *self" in scope: the buffer is
 * also stored in self->dbuf (under wrklock), which is what worker_clear ()
 * frees.  When the allocation fails the enclosing function returns -1.
 * Because it starts with a declaration it must be used where declarations
 * are allowed and cannot be wrapped in do { } while (0).
 */
#define dBUF                            \
  char *aio_buf;                        \
  LOCK (wrklock);                       \
  aio_buf = malloc (AIO_BUFSIZE);       \
  self->dbuf = aio_buf;                 \
  UNLOCK (wrklock);                     \
  if (!aio_buf)                         \
    return -1;
88
/* request types, stored in aio_cb.type and dispatched on by the workers */
enum {
  REQ_QUIT,
  REQ_OPEN,
  REQ_CLOSE,
  REQ_READ,
  REQ_WRITE,
  REQ_READAHEAD,
  REQ_SENDFILE,
  REQ_STAT,
  REQ_LSTAT,
  REQ_FSTAT,
  REQ_FSYNC,
  REQ_FDATASYNC,
  REQ_UNLINK,
  REQ_RMDIR,
  REQ_RENAME,
  REQ_MKNOD,
  REQ_READDIR,
  REQ_LINK,
  REQ_SYMLINK,
  REQ_GROUP,
  REQ_NOP,
  REQ_BUSY,
};

/* perl classes the request objects get blessed into */
#define AIO_REQ_KLASS "IO::AIO::REQ"
#define AIO_GRP_KLASS "IO::AIO::GRP"
105
106 typedef struct aio_cb
107 {
108 struct aio_cb *volatile next;
109
110 SV *data, *callback;
111 SV *fh, *fh2;
112 void *dataptr, *data2ptr;
113 Stat_t *statdata;
114 off_t offset;
115 size_t length;
116 ssize_t result;
117
118 STRLEN dataoffset;
119 int type;
120 int fd, fd2;
121 int errorno;
122 mode_t mode; /* open */
123
124 unsigned char flags;
125 unsigned char pri;
126
127 SV *self; /* the perl counterpart of this request, if any */
128 struct aio_cb *grp, *grp_prev, *grp_next, *grp_first;
129 } aio_cb;
130
131 enum {
132 FLAG_CANCELLED = 0x01,
133 };
134
135 typedef aio_cb *aio_req;
136 typedef aio_cb *aio_req_ornot;
137
/*
 * Priorities as seen from perl run from PRI_MIN to PRI_MAX.  Internally
 * they are stored with PRI_BIAS added so they can index arrays directly.
 */
enum {
  PRI_MIN     = -4,
  PRI_MAX     =  4,

  DEFAULT_PRI = 0,
  PRI_BIAS    = -PRI_MIN,
  NUM_PRI     = PRI_MAX + PRI_BIAS + 1,
};

/* biased priority the next created request will get */
static int next_pri = DEFAULT_PRI + PRI_BIAS;

/* number of worker threads started, and number of threads asked for */
static unsigned int started;
static unsigned int wanted;
150
/* static mutex initialiser, using the adaptive variant where linux offers it */
#if __linux && defined (PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP)
# define AIO_MUTEX_INIT PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP
#else
# define AIO_MUTEX_INIT PTHREAD_MUTEX_INITIALIZER
#endif

/* both take the mutex object itself, not its address */
#define LOCK(mutex)   pthread_mutex_lock   (&(mutex))
#define UNLOCK(mutex) pthread_mutex_unlock (&(mutex))

/* worker threads management */
static pthread_mutex_t wrklock = AIO_MUTEX_INIT;
162
163 typedef struct worker {
164 /* locked by wrklock */
165 struct worker *prev, *next;
166
167 pthread_t tid;
168
169 /* locked by reslock, reqlock or wrklock */
170 aio_req req; /* currently processed request */
171 void *dbuf;
172 DIR *dirp;
173 } worker;
174
175 static worker wrk_first = { &wrk_first, &wrk_first, 0 };
176
177 static void worker_clear (worker *wrk)
178 {
179 if (wrk->dirp)
180 {
181 closedir (wrk->dirp);
182 wrk->dirp = 0;
183 }
184
185 if (wrk->dbuf)
186 {
187 free (wrk->dbuf);
188 wrk->dbuf = 0;
189 }
190 }
191
192 static void worker_free (worker *wrk)
193 {
194 wrk->next->prev = wrk->prev;
195 wrk->prev->next = wrk->next;
196
197 free (wrk);
198 }
199
200 static volatile unsigned int nreqs, nready, npending;
201 static volatile unsigned int max_outstanding = 0xffffffff;
202 static int respipe [2];
203
204 static pthread_mutex_t reslock = AIO_MUTEX_INIT;
205 static pthread_mutex_t reqlock = AIO_MUTEX_INIT;
206 static pthread_cond_t reqwait = PTHREAD_COND_INITIALIZER;
207
/*
 * Accessors for the counters.  Where word reads may tear, the value is
 * read under the lock that protects its writers; otherwise the accessors
 * are plain reads.
 */
#if WORDREAD_UNSAFE

static unsigned int get_nready (void)
{
  unsigned int snapshot;

  LOCK (reqlock);
  snapshot = nready;
  UNLOCK (reqlock);

  return snapshot;
}

static unsigned int get_npending (void)
{
  unsigned int snapshot;

  LOCK (reslock);
  snapshot = npending;
  UNLOCK (reslock);

  return snapshot;
}

#else

# define get_nready()   nready
# define get_npending() npending

#endif
238
239 /*
240 * a somewhat faster data structure might be nice, but
241 * with 8 priorities this actually needs <20 insns
242 * per shift, the most expensive operation.
243 */
244 typedef struct {
245 aio_req qs[NUM_PRI], qe[NUM_PRI]; /* qstart, qend */
246 int size;
247 } reqq;
248
249 static reqq req_queue;
250 static reqq res_queue;
251
252 int reqq_push (reqq *q, aio_req req)
253 {
254 int pri = req->pri;
255 req->next = 0;
256
257 if (q->qe[pri])
258 {
259 q->qe[pri]->next = req;
260 q->qe[pri] = req;
261 }
262 else
263 q->qe[pri] = q->qs[pri] = req;
264
265 return q->size++;
266 }
267
268 aio_req reqq_shift (reqq *q)
269 {
270 int pri;
271
272 if (!q->size)
273 return 0;
274
275 --q->size;
276
277 for (pri = NUM_PRI; pri--; )
278 {
279 aio_req req = q->qs[pri];
280
281 if (req)
282 {
283 if (!(q->qs[pri] = req->next))
284 q->qe[pri] = 0;
285
286 return req;
287 }
288 }
289
290 abort ();
291 }
292
293 static int poll_cb (int max);
294 static void req_invoke (aio_req req);
295 static void req_free (aio_req req);
296 static void req_cancel (aio_req req);
297
298 /* must be called at most once */
299 static SV *req_sv (aio_req req, const char *klass)
300 {
301 if (!req->self)
302 {
303 req->self = (SV *)newHV ();
304 sv_magic (req->self, 0, PERL_MAGIC_ext, (char *)req, 0);
305 }
306
307 return sv_2mortal (sv_bless (newRV_inc (req->self), gv_stashpv (klass, 1)));
308 }
309
310 static aio_req SvAIO_REQ (SV *sv)
311 {
312 MAGIC *mg;
313
314 if (!sv_derived_from (sv, AIO_REQ_KLASS) || !SvROK (sv))
315 croak ("object of class " AIO_REQ_KLASS " expected");
316
317 mg = mg_find (SvRV (sv), PERL_MAGIC_ext);
318
319 return mg ? (aio_req)mg->mg_ptr : 0;
320 }
321
322 static void aio_grp_feed (aio_req grp)
323 {
324 while (grp->length < grp->fd2 && !(grp->flags & FLAG_CANCELLED))
325 {
326 int old_len = grp->length;
327
328 if (grp->fh2 && SvOK (grp->fh2))
329 {
330 dSP;
331
332 ENTER;
333 SAVETMPS;
334 PUSHMARK (SP);
335 XPUSHs (req_sv (grp, AIO_GRP_KLASS));
336 PUTBACK;
337 call_sv (grp->fh2, G_VOID | G_EVAL | G_KEEPERR);
338 SPAGAIN;
339 FREETMPS;
340 LEAVE;
341 }
342
343 /* stop if no progress has been made */
344 if (old_len == grp->length)
345 {
346 SvREFCNT_dec (grp->fh2);
347 grp->fh2 = 0;
348 break;
349 }
350 }
351 }
352
353 static void aio_grp_dec (aio_req grp)
354 {
355 --grp->length;
356
357 /* call feeder, if applicable */
358 aio_grp_feed (grp);
359
360 /* finish, if done */
361 if (!grp->length && grp->fd)
362 {
363 req_invoke (grp);
364 req_free (grp);
365 }
366 }
367
368 static void req_invoke (aio_req req)
369 {
370 dSP;
371
372 if (!(req->flags & FLAG_CANCELLED) && SvOK (req->callback))
373 {
374 ENTER;
375 SAVETMPS;
376 PUSHMARK (SP);
377 EXTEND (SP, 1);
378
379 switch (req->type)
380 {
381 case REQ_READDIR:
382 {
383 SV *rv = &PL_sv_undef;
384
385 if (req->result >= 0)
386 {
387 int i;
388 char *buf = req->data2ptr;
389 AV *av = newAV ();
390
391 av_extend (av, req->result - 1);
392
393 for (i = 0; i < req->result; ++i)
394 {
395 SV *sv = newSVpv (buf, 0);
396
397 av_store (av, i, sv);
398 buf += SvCUR (sv) + 1;
399 }
400
401 rv = sv_2mortal (newRV_noinc ((SV *)av));
402 }
403
404 PUSHs (rv);
405 }
406 break;
407
408 case REQ_OPEN:
409 {
410 /* convert fd to fh */
411 SV *fh;
412
413 PUSHs (sv_2mortal (newSViv (req->result)));
414 PUTBACK;
415 call_pv ("IO::AIO::_fd2fh", G_SCALAR | G_EVAL);
416 SPAGAIN;
417
418 fh = SvREFCNT_inc (POPs);
419
420 PUSHMARK (SP);
421 XPUSHs (sv_2mortal (fh));
422 }
423 break;
424
425 case REQ_GROUP:
426 req->fd = 2; /* mark group as finished */
427
428 if (req->data)
429 {
430 int i;
431 AV *av = (AV *)req->data;
432
433 EXTEND (SP, AvFILL (av) + 1);
434 for (i = 0; i <= AvFILL (av); ++i)
435 PUSHs (*av_fetch (av, i, 0));
436 }
437 break;
438
439 case REQ_NOP:
440 case REQ_BUSY:
441 break;
442
443 default:
444 PUSHs (sv_2mortal (newSViv (req->result)));
445 break;
446 }
447
448 errno = req->errorno;
449
450 PUTBACK;
451 call_sv (req->callback, G_VOID | G_EVAL);
452 SPAGAIN;
453
454 FREETMPS;
455 LEAVE;
456 }
457
458 if (req->grp)
459 {
460 aio_req grp = req->grp;
461
462 /* unlink request */
463 if (req->grp_next) req->grp_next->grp_prev = req->grp_prev;
464 if (req->grp_prev) req->grp_prev->grp_next = req->grp_next;
465
466 if (grp->grp_first == req)
467 grp->grp_first = req->grp_next;
468
469 aio_grp_dec (grp);
470 }
471
472 if (SvTRUE (ERRSV))
473 {
474 req_free (req);
475 croak (0);
476 }
477 }
478
479 static void req_free (aio_req req)
480 {
481 if (req->self)
482 {
483 sv_unmagic (req->self, PERL_MAGIC_ext);
484 SvREFCNT_dec (req->self);
485 }
486
487 SvREFCNT_dec (req->data);
488 SvREFCNT_dec (req->fh);
489 SvREFCNT_dec (req->fh2);
490 SvREFCNT_dec (req->callback);
491 Safefree (req->statdata);
492
493 if (req->type == REQ_READDIR)
494 free (req->data2ptr);
495
496 Safefree (req);
497 }
498
499 static void req_cancel_subs (aio_req grp)
500 {
501 aio_req sub;
502
503 if (grp->type != REQ_GROUP)
504 return;
505
506 SvREFCNT_dec (grp->fh2);
507 grp->fh2 = 0;
508
509 for (sub = grp->grp_first; sub; sub = sub->grp_next)
510 req_cancel (sub);
511 }
512
513 static void req_cancel (aio_req req)
514 {
515 req->flags |= FLAG_CANCELLED;
516
517 req_cancel_subs (req);
518 }
519
520 static void *aio_proc(void *arg);
521
522 static void start_thread (void)
523 {
524 sigset_t fullsigset, oldsigset;
525 pthread_attr_t attr;
526
527 worker *wrk = calloc (1, sizeof (worker));
528
529 if (!wrk)
530 croak ("unable to allocate worker thread data");
531
532 pthread_attr_init (&attr);
533 pthread_attr_setstacksize (&attr, STACKSIZE);
534 pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
535 #ifdef PTHREAD_SCOPE_PROCESS
536 pthread_attr_setscope (&attr, PTHREAD_SCOPE_PROCESS);
537 #endif
538
539 sigfillset (&fullsigset);
540
541 LOCK (wrklock);
542 sigprocmask (SIG_SETMASK, &fullsigset, &oldsigset);
543
544 if (pthread_create (&wrk->tid, &attr, aio_proc, (void *)wrk) == 0)
545 {
546 wrk->prev = &wrk_first;
547 wrk->next = wrk_first.next;
548 wrk_first.next->prev = wrk;
549 wrk_first.next = wrk;
550 ++started;
551 }
552 else
553 free (wrk);
554
555 sigprocmask (SIG_SETMASK, &oldsigset, 0);
556 UNLOCK (wrklock);
557 }
558
559 static void maybe_start_thread ()
560 {
561 #if 0
562 static struct timeval last;
563 struct timeval diff, now;
564 #endif
565
566 if (started >= wanted)
567 return;
568
569 if (nready <= nreqs - get_nready () - get_npending ())
570 return;
571
572 #if 0
573 gettimeofday (&now, 0);
574
575 diff.tv_sec = now.tv_sec - last.tv_sec;
576 diff.tv_usec = now.tv_usec - last.tv_usec;
577
578 if (diff.tv_usec < 0)
579 {
580 --diff.tv_sec;
581 diff.tv_usec += 1000000;
582 }
583
584 if (!diff.tv_sec && diff.tv_usec < 10000)
585 return;
586
587 last = now;
588 #endif
589
590 start_thread ();
591 }
592
593 static void req_send (aio_req req)
594 {
595 ++nreqs;
596
597 LOCK (reqlock);
598 ++nready;
599 reqq_push (&req_queue, req);
600 pthread_cond_signal (&reqwait);
601 UNLOCK (reqlock);
602
603 maybe_start_thread ();
604 }
605
606 static void end_thread (void)
607 {
608 aio_req req;
609
610 Newz (0, req, 1, aio_cb);
611
612 req->type = REQ_QUIT;
613 req->pri = PRI_MAX + PRI_BIAS;
614
615 req_send (req);
616
617 LOCK (wrklock);
618 --started;
619 UNLOCK (wrklock);
620 }
621
622 static void min_parallel (int nthreads)
623 {
624 if (wanted < nthreads)
625 wanted = nthreads;
626 }
627
628 static void max_parallel (int nthreads)
629 {
630 if (wanted > nthreads)
631 wanted = nthreads;
632
633 while (started > wanted)
634 end_thread ();
635 }
636
637 static void poll_wait ()
638 {
639 fd_set rfd;
640
641 while (nreqs)
642 {
643 int size;
644 if (WORDREAD_UNSAFE) LOCK (reslock);
645 size = res_queue.size;
646 if (WORDREAD_UNSAFE) UNLOCK (reslock);
647
648 if (size)
649 return;
650
651 maybe_start_thread ();
652
653 FD_ZERO(&rfd);
654 FD_SET(respipe [0], &rfd);
655
656 select (respipe [0] + 1, &rfd, 0, 0, 0);
657 }
658 }
659
660 static int poll_cb (int max)
661 {
662 dSP;
663 int count = 0;
664 int do_croak = 0;
665 aio_req req;
666
667 for (;;)
668 {
669 while (max <= 0 || count < max)
670 {
671 maybe_start_thread ();
672
673 LOCK (reslock);
674 req = reqq_shift (&res_queue);
675
676 if (req)
677 {
678 --npending;
679
680 if (!res_queue.size)
681 {
682 /* read any signals sent by the worker threads */
683 char buf [32];
684 while (read (respipe [0], buf, 32) == 32)
685 ;
686 }
687 }
688
689 UNLOCK (reslock);
690
691 if (!req)
692 break;
693
694 --nreqs;
695
696 if (req->type == REQ_GROUP && req->length)
697 {
698 req->fd = 1; /* mark request as delayed */
699 continue;
700 }
701 else
702 {
703 if (req->type == REQ_READ)
704 SvCUR_set (req->data, req->dataoffset + (req->result > 0 ? req->result : 0));
705
706 if (req->data2ptr && (req->type == REQ_READ || req->type == REQ_WRITE))
707 SvREADONLY_off (req->data);
708
709 if (req->statdata)
710 {
711 PL_laststype = req->type == REQ_LSTAT ? OP_LSTAT : OP_STAT;
712 PL_laststatval = req->result;
713 PL_statcache = *(req->statdata);
714 }
715
716 req_invoke (req);
717
718 count++;
719 }
720
721 req_free (req);
722 }
723
724 if (nreqs <= max_outstanding)
725 break;
726
727 poll_wait ();
728
729 max = 0;
730 }
731
732 return count;
733 }
734
735 static void create_pipe ()
736 {
737 if (pipe (respipe))
738 croak ("unable to initialize result pipe");
739
740 if (fcntl (respipe [0], F_SETFL, O_NONBLOCK))
741 croak ("cannot set result pipe to nonblocking mode");
742
743 if (fcntl (respipe [1], F_SETFL, O_NONBLOCK))
744 croak ("cannot set result pipe to nonblocking mode");
745 }
746
747 /*****************************************************************************/
748 /* work around various missing functions */
749
#if !HAVE_PREADWRITE
# define pread  aio_pread
# define pwrite aio_pwrite

/*
 * make our pread/pwrite safe against themselves, but not against
 * normal read/write by using a mutex. slows down execution a lot,
 * but that's your problem, not mine.
 */
static pthread_mutex_t preadwritelock = PTHREAD_MUTEX_INITIALIZER;

/*
 * Emulated pread: read count bytes at offset and put the file position
 * back to where it was before the call.  Returns what read () returned.
 */
static ssize_t pread (int fd, void *buf, size_t count, off_t offset)
{
  ssize_t res;
  off_t ooffset;

  pthread_mutex_lock (&preadwritelock);
  ooffset = lseek (fd, 0, SEEK_CUR);
  lseek (fd, offset, SEEK_SET);
  res = read (fd, buf, count);
  lseek (fd, ooffset, SEEK_SET);
  pthread_mutex_unlock (&preadwritelock);

  return res;
}

/*
 * Emulated pwrite: write count bytes at offset and put the file position
 * back to where it was before the call.  Returns what write () returned.
 */
static ssize_t pwrite (int fd, const void *buf, size_t count, off_t offset)
{
  ssize_t res;
  off_t ooffset;

  pthread_mutex_lock (&preadwritelock);
  ooffset = lseek (fd, 0, SEEK_CUR);
  lseek (fd, offset, SEEK_SET);
  res = write (fd, buf, count);
  /* restore the saved position, not the write offset */
  lseek (fd, ooffset, SEEK_SET);
  pthread_mutex_unlock (&preadwritelock);

  return res;
}
#endif
791
/* without fdatasync, fall back to a full fsync */
#if !HAVE_FDATASYNC
# define fdatasync(fd) fsync (fd)
#endif
795
796 #if !HAVE_READAHEAD
797 # define readahead(fd,offset,count) aio_readahead (fd, offset, count, self)
798
799 static ssize_t aio_readahead (int fd, off_t offset, size_t count, worker *self)
800 {
801 dBUF;
802
803 while (count > 0)
804 {
805 size_t len = count < AIO_BUFSIZE ? count : AIO_BUFSIZE;
806
807 pread (fd, aio_buf, len, offset);
808 offset += len;
809 count -= len;
810 }
811
812 errno = 0;
813 }
814
815 #endif
816
#if !HAVE_READDIR_R
# define readdir_r aio_readdir_r

static pthread_mutex_t readdirlock = PTHREAD_MUTEX_INITIALIZER;

/*
 * Emulated readdir_r: serialise readdir () with a mutex and copy the
 * entry name into the caller's buffer.  Only d_name is copied.
 * *res is ent when an entry was read and 0 otherwise.  Returns 0 when
 * an entry was read and -1 otherwise (also at the end of the directory);
 * errno is left as readdir () set it.
 */
static int readdir_r (DIR *dirp, struct dirent *ent, struct dirent **res)
{
  struct dirent *found;
  int saved_errno;
  int status;

  LOCK (readdirlock);

  found = readdir (dirp);
  saved_errno = errno;

  if (!found)
    {
      *res = 0;
      status = -1;
    }
  else
    {
      *res = ent;
      strcpy (ent->d_name, found->d_name);
      status = 0;
    }

  UNLOCK (readdirlock);

  errno = saved_errno;
  return status;
}
#endif
846
847 /* sendfile always needs emulation */
848 static ssize_t sendfile_ (int ofd, int ifd, off_t offset, size_t count, worker *self)
849 {
850 ssize_t res;
851
852 if (!count)
853 return 0;
854
855 #if HAVE_SENDFILE
856 # if __linux
857 res = sendfile (ofd, ifd, &offset, count);
858
859 # elif __freebsd
860 /*
861 * Of course, the freebsd sendfile is a dire hack with no thoughts
862 * wasted on making it similar to other I/O functions.
863 */
864 {
865 off_t sbytes;
866 res = sendfile (ifd, ofd, offset, count, 0, &sbytes, 0);
867
868 if (res < 0 && sbytes)
869 /* maybe only on EAGAIN: as usual, the manpage leaves you guessing */
870 res = sbytes;
871 }
872
873 # elif __hpux
874 res = sendfile (ofd, ifd, offset, count, 0, 0);
875
876 # elif __solaris
877 {
878 struct sendfilevec vec;
879 size_t sbytes;
880
881 vec.sfv_fd = ifd;
882 vec.sfv_flag = 0;
883 vec.sfv_off = offset;
884 vec.sfv_len = count;
885
886 res = sendfilev (ofd, &vec, 1, &sbytes);
887
888 if (res < 0 && sbytes)
889 res = sbytes;
890 }
891
892 # endif
893 #else
894 res = -1;
895 errno = ENOSYS;
896 #endif
897
898 if (res < 0
899 && (errno == ENOSYS || errno == EINVAL || errno == ENOTSOCK
900 #if __solaris
901 || errno == EAFNOSUPPORT || errno == EPROTOTYPE
902 #endif
903 )
904 )
905 {
906 /* emulate sendfile. this is a major pain in the ass */
907 dBUF;
908
909 res = 0;
910
911 while (count)
912 {
913 ssize_t cnt;
914
915 cnt = pread (ifd, aio_buf, count > AIO_BUFSIZE ? AIO_BUFSIZE : count, offset);
916
917 if (cnt <= 0)
918 {
919 if (cnt && !res) res = -1;
920 break;
921 }
922
923 cnt = write (ofd, aio_buf, cnt);
924
925 if (cnt <= 0)
926 {
927 if (cnt && !res) res = -1;
928 break;
929 }
930
931 offset += cnt;
932 res += cnt;
933 count -= cnt;
934 }
935 }
936
937 return res;
938 }
939
940 /* read a full directory */
941 static void scandir_ (aio_req req, worker *self)
942 {
943 DIR *dirp;
944 union
945 {
946 struct dirent d;
947 char b [offsetof (struct dirent, d_name) + NAME_MAX + 1];
948 } *u;
949 struct dirent *entp;
950 char *name, *names;
951 int memlen = 4096;
952 int memofs = 0;
953 int res = 0;
954 int errorno;
955
956 LOCK (wrklock);
957 self->dirp = dirp = opendir (req->dataptr);
958 self->dbuf = u = malloc (sizeof (*u));
959 req->data2ptr = names = malloc (memlen);
960 UNLOCK (wrklock);
961
962 if (dirp && u && names)
963 for (;;)
964 {
965 errno = 0;
966 readdir_r (dirp, &u->d, &entp);
967
968 if (!entp)
969 break;
970
971 name = entp->d_name;
972
973 if (name [0] != '.' || (name [1] && (name [1] != '.' || name [2])))
974 {
975 int len = strlen (name) + 1;
976
977 res++;
978
979 while (memofs + len > memlen)
980 {
981 memlen *= 2;
982 LOCK (wrklock);
983 req->data2ptr = names = realloc (names, memlen);
984 UNLOCK (wrklock);
985
986 if (!names)
987 break;
988 }
989
990 memcpy (names + memofs, name, len);
991 memofs += len;
992 }
993 }
994
995 if (errno)
996 res = -1;
997
998 req->result = res;
999 }
1000
1001 /*****************************************************************************/
1002
1003 static void *aio_proc (void *thr_arg)
1004 {
1005 aio_req req;
1006 worker *self = (worker *)thr_arg;
1007
1008 for (;;)
1009 {
1010 LOCK (reqlock);
1011
1012 for (;;)
1013 {
1014 self->req = req = reqq_shift (&req_queue);
1015
1016 if (req)
1017 break;
1018
1019 pthread_cond_wait (&reqwait, &reqlock);
1020 }
1021
1022 --nready;
1023
1024 UNLOCK (reqlock);
1025
1026 errno = 0; /* strictly unnecessary */
1027
1028 if (!(req->flags & FLAG_CANCELLED))
1029 switch (req->type)
1030 {
1031 case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break;
1032 case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break;
1033
1034 case REQ_READAHEAD: req->result = readahead (req->fd, req->offset, req->length); break;
1035 case REQ_SENDFILE: req->result = sendfile_ (req->fd, req->fd2, req->offset, req->length, self); break;
1036
1037 case REQ_STAT: req->result = stat (req->dataptr, req->statdata); break;
1038 case REQ_LSTAT: req->result = lstat (req->dataptr, req->statdata); break;
1039 case REQ_FSTAT: req->result = fstat (req->fd , req->statdata); break;
1040
1041 case REQ_OPEN: req->result = open (req->dataptr, req->fd, req->mode); break;
1042 case REQ_CLOSE: req->result = close (req->fd); break;
1043 case REQ_UNLINK: req->result = unlink (req->dataptr); break;
1044 case REQ_RMDIR: req->result = rmdir (req->dataptr); break;
1045 case REQ_RENAME: req->result = rename (req->data2ptr, req->dataptr); break;
1046 case REQ_LINK: req->result = link (req->data2ptr, req->dataptr); break;
1047 case REQ_SYMLINK: req->result = symlink (req->data2ptr, req->dataptr); break;
1048 case REQ_MKNOD: req->result = mknod (req->data2ptr, req->mode, (dev_t)req->offset); break;
1049
1050 case REQ_FDATASYNC: req->result = fdatasync (req->fd); break;
1051 case REQ_FSYNC: req->result = fsync (req->fd); break;
1052 case REQ_READDIR: scandir_ (req, self); break;
1053
1054 case REQ_BUSY:
1055 {
1056 struct timeval tv;
1057
1058 tv.tv_sec = req->fd;
1059 tv.tv_usec = req->fd2;
1060
1061 req->result = select (0, 0, 0, 0, &tv);
1062 }
1063
1064 case REQ_GROUP:
1065 case REQ_NOP:
1066 break;
1067
1068 case REQ_QUIT:
1069 LOCK (wrklock);
1070 worker_free (self);
1071 --started;
1072 UNLOCK (wrklock);
1073 return 0;
1074
1075 default:
1076 req->result = ENOSYS;
1077 break;
1078 }
1079
1080 req->errorno = errno;
1081
1082 LOCK (reslock);
1083
1084 ++npending;
1085
1086 if (!reqq_push (&res_queue, req))
1087 /* write a dummy byte to the pipe so fh becomes ready */
1088 write (respipe [1], &respipe, 1);
1089
1090 self->req = 0;
1091 worker_clear (self);
1092
1093 UNLOCK (reslock);
1094 }
1095 }
1096
1097 /*****************************************************************************/
1098
1099 static void atfork_prepare (void)
1100 {
1101 LOCK (wrklock);
1102 LOCK (reqlock);
1103 LOCK (reslock);
1104 #if !HAVE_PREADWRITE
1105 LOCK (preadwritelock);
1106 #endif
1107 #if !HAVE_READDIR_R
1108 LOCK (readdirlock);
1109 #endif
1110 }
1111
1112 static void atfork_parent (void)
1113 {
1114 #if !HAVE_READDIR_R
1115 UNLOCK (readdirlock);
1116 #endif
1117 #if !HAVE_PREADWRITE
1118 UNLOCK (preadwritelock);
1119 #endif
1120 UNLOCK (reslock);
1121 UNLOCK (reqlock);
1122 UNLOCK (wrklock);
1123 }
1124
1125 static void atfork_child (void)
1126 {
1127 aio_req prv;
1128
1129 while (prv = reqq_shift (&req_queue))
1130 req_free (prv);
1131
1132 while (prv = reqq_shift (&res_queue))
1133 req_free (prv);
1134
1135 while (wrk_first.next != &wrk_first)
1136 {
1137 worker *wrk = wrk_first.next;
1138
1139 if (wrk->req)
1140 req_free (wrk->req);
1141
1142 worker_clear (wrk);
1143 worker_free (wrk);
1144 }
1145
1146 started = 0;
1147 nreqs = 0;
1148
1149 close (respipe [0]);
1150 close (respipe [1]);
1151 create_pipe ();
1152
1153 atfork_parent ();
1154 }
1155
/*
 * dREQ: declare and allocate a zeroed request "req" inside an XSUB.
 * Expects an "SV *callback" in scope and croaks unless it is undef or a
 * reference.  The request gets a copy of the callback and the priority
 * selected for the next request; that priority is then reset to the
 * default.  Starts with declarations and ends without a semicolon, so it
 * is written as "dREQ;".
 */
#define dREQ                                                    \
        aio_req req;                                            \
        int req_pri = next_pri;                                 \
        next_pri = DEFAULT_PRI + PRI_BIAS;                      \
                                                                \
        if (SvOK (callback) && !SvROK (callback))               \
          croak ("callback must be undef or of reference type"); \
                                                                \
        Newz (0, req, 1, aio_cb);                               \
        if (!req)                                               \
          croak ("out of memory during aio_req allocation");    \
                                                                \
        req->callback = newSVsv (callback);                     \
        req->pri = req_pri
1170
/*
 * REQ_SEND: submit "req" and, unless the XSUB was called in void context,
 * push the request object as return value.  Takes no arguments.
 */
#define REQ_SEND                                \
        req_send (req);                         \
                                                \
        if (GIMME_V != G_VOID)                  \
          XPUSHs (req_sv (req, AIO_REQ_KLASS));
1176
1177 MODULE = IO::AIO PACKAGE = IO::AIO
1178
1179 PROTOTYPES: ENABLE
1180
BOOT:
{
        /* constants exported as IO::AIO::<name> */
        static const struct {
          const char *name;
          IV value;
        } consts[] = {
          { "EXDEV"   , EXDEV    },
          { "O_RDONLY", O_RDONLY },
          { "O_WRONLY", O_WRONLY },
          { "O_CREAT" , O_CREAT  },
          { "O_TRUNC" , O_TRUNC  },
          { "S_IFIFO" , S_IFIFO  },
        };
        HV *stash = gv_stashpv ("IO::AIO", 1);
        unsigned int idx;

        for (idx = 0; idx < sizeof (consts) / sizeof (consts [0]); ++idx)
          newCONSTSUB (stash, (char *)consts [idx].name, newSViv (consts [idx].value));

        /* result pipe first, then the fork handlers, then the first worker */
        create_pipe ();
        pthread_atfork (atfork_prepare, atfork_parent, atfork_child);

        start_thread ();
}
1197
void
min_parallel (int nthreads)
        PROTOTYPE: $
        CODE:
        /* forwards to the C function of the same name */
        min_parallel (nthreads);
1201
void
max_parallel (int nthreads)
        PROTOTYPE: $
        CODE:
        /* forwards to the C function of the same name */
        max_parallel (nthreads);
1205
int
max_outstanding (int maxreqs)
        PROTOTYPE: $
        CODE:
        {
          /* set the new limit and hand back the one it replaces */
          int previous = max_outstanding;

          max_outstanding = maxreqs;
          RETVAL = previous;
        }
        OUTPUT:
        RETVAL
1214
void
aio_open (pathname,flags,mode,callback=&PL_sv_undef)
        SV *    pathname
        int     flags
        int     mode
        SV *    callback
        PROTOTYPE: $$$;$
        PPCODE:
        {
          dREQ;

          /* the request keeps its own copy of the path */
          req->data    = newSVsv (pathname);
          req->dataptr = SvPVbyte_nolen (req->data);
          req->mode    = mode;
          req->fd      = flags; /* the open flags travel in the fd member */
          req->type    = REQ_OPEN;

          REQ_SEND;
        }
1234
void
aio_close (fh,callback=&PL_sv_undef)
        SV *    fh
        SV *    callback
        PROTOTYPE: $;$
        ALIAS:
           aio_close     = REQ_CLOSE
           aio_fsync     = REQ_FSYNC
           aio_fdatasync = REQ_FDATASYNC
        PPCODE:
        {
          dREQ;

          /* the alias index is the request type */
          req->type = ix;
          req->fh   = newSVsv (fh); /* keeps the handle alive while the request runs */
          req->fd   = PerlIO_fileno (IoIFP (sv_2io (fh)));

          /* REQ_SEND takes no arguments */
          REQ_SEND;
        }
1254
void
aio_read (fh,offset,length,data,dataoffset,callback=&PL_sv_undef)
        SV *    fh
        UV      offset
        IV      length
        SV *    data
        IV      dataoffset
        SV *    callback
        ALIAS:
           aio_read  = REQ_READ
           aio_write = REQ_WRITE
        PROTOTYPE: $$$$$;$
        PPCODE:
        {
          /*
           * length and dataoffset are signed so the checks below can see
           * negative values: a negative dataoffset counts from the end of
           * the string, a negative write length means "up to the end of
           * the string", and a negative read length is an error.
           */
          STRLEN svlen;
          char *svptr = SvPVbyte (data, svlen);

          SvUPGRADE (data, SVt_PV);
          SvPOK_on (data);

          if (dataoffset < 0)
            dataoffset += svlen;

          if (dataoffset < 0 || (STRLEN)dataoffset > svlen)
            croak ("data offset outside of string");

          if (ix == REQ_WRITE)
            {
              /* write: check length and adjust. */
              if (length < 0 || (STRLEN)length > svlen - (STRLEN)dataoffset)
                length = svlen - dataoffset;
            }
          else
            {
              if (length < 0)
                croak ("length must not be negative");

              /* read: grow scalar as necessary */
              svptr = SvGROW (data, (STRLEN)length + (STRLEN)dataoffset);
            }

          {
            dREQ;

            req->type = ix;
            req->fh = newSVsv (fh);
            req->fd = PerlIO_fileno (ix == REQ_READ ? IoIFP (sv_2io (fh))
                                                    : IoOFP (sv_2io (fh)));
            req->offset = offset;
            req->length = length;
            req->data = SvREFCNT_inc (data);
            req->dataptr = (char *)svptr + dataoffset;

            /* protect the buffer while the request is in flight; data2ptr
               records that poll_cb has to lift the protection again */
            if (!SvREADONLY (data))
              {
                SvREADONLY_on (data);
                req->data2ptr = (void *)data;
              }

            REQ_SEND;
          }
        }
1318
void
aio_sendfile (out_fh,in_fh,in_offset,length,callback=&PL_sv_undef)
        SV *    out_fh
        SV *    in_fh
        UV      in_offset
        UV      length
        SV *    callback
        PROTOTYPE: $$$$;$
        PPCODE:
        {
          dREQ;

          req->type   = REQ_SENDFILE;

          /* destination in fh/fd */
          req->fh     = newSVsv (out_fh);
          req->fd     = PerlIO_fileno (IoIFP (sv_2io (out_fh)));

          /* source in fh2/fd2 */
          req->fh2    = newSVsv (in_fh);
          req->fd2    = PerlIO_fileno (IoIFP (sv_2io (in_fh)));

          req->offset = in_offset;
          req->length = length;

          REQ_SEND;
        }
1341
void
aio_readahead (fh,offset,length,callback=&PL_sv_undef)
        SV *    fh
        UV      offset
        IV      length
        SV *    callback
        PROTOTYPE: $$$;$
        PPCODE:
        {
          dREQ;

          req->type   = REQ_READAHEAD;
          req->fh     = newSVsv (fh); /* keeps the handle alive while the request runs */
          req->fd     = PerlIO_fileno (IoIFP (sv_2io (fh)));
          req->length = length;
          req->offset = offset;

          REQ_SEND;
        }
1361
void
aio_stat (fh_or_path,callback=&PL_sv_undef)
        SV *    fh_or_path
        SV *    callback
        ALIAS:
           aio_stat  = REQ_STAT
           aio_lstat = REQ_LSTAT
        PPCODE:
        {
          dREQ;

          New (0, req->statdata, 1, Stat_t);
          if (!req->statdata)
            {
              req_free (req);
              croak ("out of memory during aio_req->statdata allocation");
            }

          if (!SvPOK (fh_or_path))
            {
              /* not a string: treat the argument as a file handle */
              req->type = REQ_FSTAT;
              req->fh   = newSVsv (fh_or_path);
              req->fd   = PerlIO_fileno (IoIFP (sv_2io (fh_or_path)));
            }
          else
            {
              /* a string is a path; the alias picks stat or lstat */
              req->type    = ix;
              req->data    = newSVsv (fh_or_path);
              req->dataptr = SvPVbyte_nolen (req->data);
            }

          REQ_SEND;
        }
1395
void
aio_unlink (pathname,callback=&PL_sv_undef)
        SV *    pathname
        SV *    callback
        ALIAS:
           aio_unlink  = REQ_UNLINK
           aio_rmdir   = REQ_RMDIR
           aio_readdir = REQ_READDIR
        PPCODE:
        {
          dREQ;

          /* single-path requests: private copy of the path in data/dataptr */
          req->data    = newSVsv (pathname);
          req->dataptr = SvPVbyte_nolen (req->data);
          req->type    = ix;

          REQ_SEND;
        }
1414
void
aio_link (oldpath,newpath,callback=&PL_sv_undef)
        SV *    oldpath
        SV *    newpath
        SV *    callback
        ALIAS:
           aio_link    = REQ_LINK
           aio_symlink = REQ_SYMLINK
           aio_rename  = REQ_RENAME
        PPCODE:
        {
          dREQ;

          req->type     = ix;

          /* old path: copy kept in fh, raw pointer in data2ptr */
          req->fh       = newSVsv (oldpath);
          req->data2ptr = SvPVbyte_nolen (req->fh);

          /* new path: copy kept in data, raw pointer in dataptr */
          req->data     = newSVsv (newpath);
          req->dataptr  = SvPVbyte_nolen (req->data);

          REQ_SEND;
        }
1436
void
aio_mknod (pathname,mode,dev,callback=&PL_sv_undef)
        SV *    pathname
        SV *    callback
        UV      mode
        UV      dev
        PPCODE:
        {
          dREQ;

          req->type    = REQ_MKNOD;
          req->data    = newSVsv (pathname);
          req->dataptr = SvPVbyte_nolen (req->data);
          req->offset  = dev; /* the device number travels in the offset member */
          req->mode    = (mode_t)mode;

          REQ_SEND;
        }
1455
void
aio_busy (delay,callback=&PL_sv_undef)
        double  delay
        SV *    callback
        PPCODE:
        {
          dREQ;

          /*
           * The worker copies fd to tv_sec and fd2 to tv_usec, so the
           * fractional part has to be scaled to microseconds.
           * Negative delays are treated as zero.
           */
          req->type = REQ_BUSY;
          req->fd   = delay < 0. ? 0 : delay;
          req->fd2  = delay < 0. ? 0 : 1000000. * (delay - req->fd);

          REQ_SEND;
        }
1470
void
aio_group (callback=&PL_sv_undef)
        SV *    callback
        PROTOTYPE: ;$
        PPCODE:
        {
          dREQ;

          req->type = REQ_GROUP;
          req_send (req);

          /* unlike other requests, the group object is returned in every context */
          XPUSHs (req_sv (req, AIO_GRP_KLASS));
        }
1484
void
aio_nop (callback=&PL_sv_undef)
        SV *    callback
        PPCODE:
        {
          dREQ;

          /* the request just passes through the queues */
          req->type = REQ_NOP;

          REQ_SEND;
        }
1496
int
aioreq_pri (int pri = 0)
        PROTOTYPE: ;$
        CODE:
        /* report the priority pending for the next request, unbiased */
        RETVAL = next_pri - PRI_BIAS;

        /* with an argument, also set it, limited to PRI_MIN .. PRI_MAX */
        if (items > 0)
          {
            if (pri > PRI_MAX)
              pri = PRI_MAX;
            else if (pri < PRI_MIN)
              pri = PRI_MIN;

            next_pri = pri + PRI_BIAS;
          }
        OUTPUT:
        RETVAL
1510
void
aioreq_nice (int nice = 0)
        CODE:
        /*
         * Lower the priority of the next request by "nice".
         * next_pri is stored with PRI_BIAS added, so the bias has to be
         * removed before clamping to PRI_MIN .. PRI_MAX and added back
         * afterwards.
         */
        nice = (next_pri - PRI_BIAS) - nice;
        if (nice < PRI_MIN) nice = PRI_MIN;
        if (nice > PRI_MAX) nice = PRI_MAX;
        next_pri = nice + PRI_BIAS;
1518
void
flush ()
        PROTOTYPE:
        CODE:
        /* keep waiting for and handling results until nothing is outstanding */
        for (; nreqs; )
          {
            poll_wait ();
            poll_cb (0);
          }
1528
void
poll()
        PROTOTYPE:
        CODE:
        /* one round: wait for a result, then handle whatever is ready */
        if (nreqs != 0)
          {
            poll_wait ();
            poll_cb (0);
          }
1538
int
poll_fileno()
        PROTOTYPE:
        CODE:
        /* the read end of the result pipe becomes readable when results are queued */
        RETVAL = respipe [0];
        OUTPUT:
        RETVAL
1546
int
poll_cb(...)
        PROTOTYPE:
        CODE:
        /* arguments are accepted and ignored; handle results without a limit */
        RETVAL = poll_cb (0);
        OUTPUT:
        RETVAL
1554
int
poll_some(int max = 0)
        PROTOTYPE: ;$
        CODE:
        /* max is optional (0 means no limit), hence the ";$" prototype */
        RETVAL = poll_cb (max);
        OUTPUT:
        RETVAL
1562
void
poll_wait()
        PROTOTYPE:
        CODE:
        /* nothing to wait for when no request is outstanding */
        if (nreqs != 0)
          poll_wait ();
1569
int
nreqs()
        PROTOTYPE:
        CODE:
        /* requests submitted and not yet handled by poll_cb */
        RETVAL = nreqs;
        OUTPUT:
        RETVAL
1577
int
nready()
        PROTOTYPE:
        CODE:
        /* requests waiting in the request queue */
        RETVAL = get_nready ();
        OUTPUT:
        RETVAL
1585
int
npending()
        PROTOTYPE:
        CODE:
        /* results waiting in the result queue */
        RETVAL = get_npending ();
        OUTPUT:
        RETVAL
1593
1594 PROTOTYPES: DISABLE
1595
1596 MODULE = IO::AIO PACKAGE = IO::AIO::REQ
1597
void
cancel (aio_req_ornot req)
        CODE:
        /* flags the request; for groups this cascades to the members */
        req_cancel (req);
1602
void
cb (aio_req_ornot req, SV *callback=&PL_sv_undef)
        CODE:
        {
          /* release the old callback, then store a copy of the new one */
          SV *old_cb = req->callback;

          SvREFCNT_dec (old_cb);
          req->callback = newSVsv (callback);
        }
1608
1609 MODULE = IO::AIO PACKAGE = IO::AIO::GRP
1610
void
add (aio_req grp, ...)
        PPCODE:
        {
          int idx;

          if (grp->fd == 2)
            croak ("cannot add requests to IO::AIO::GRP after the group finished");

          for (idx = 1; idx < items; ++idx)
            {
              aio_req member;

              /* outside void context the arguments are handed back as copies */
              if (GIMME_V != G_VOID)
                XPUSHs (sv_2mortal (newSVsv (ST (idx))));

              member = SvAIO_REQ (ST (idx));

              /* objects whose request is already gone are skipped */
              if (!member)
                continue;

              ++grp->length;
              member->grp = grp;

              /* push onto the front of the group's member list */
              member->grp_prev = 0;
              member->grp_next = grp->grp_first;

              if (grp->grp_first)
                grp->grp_first->grp_prev = member;

              grp->grp_first = member;
            }
        }
1643
void
cancel_subs (aio_req_ornot req)
        CODE:
        /* cancels the members and drops the feeder, the group itself stays */
        req_cancel_subs (req);
1648
void
result (aio_req grp, ...)
        CODE:
        {
          AV *results = newAV ();
          int idx;

          /* remember the current errno together with the result list */
          grp->errorno = errno;

          for (idx = 1; idx < items; ++idx)
            av_push (results, newSVsv (ST (idx)));

          /* replace any earlier result list */
          SvREFCNT_dec (grp->data);
          grp->data = (SV *)results;
        }
1666
void
errno (aio_req grp, int errorno = errno)
        CODE:
        /* without an argument the current errno is stored */
        grp->errorno = errorno;
1671
void
limit (aio_req grp, int limit)
        CODE:
        /* the feed limit lives in fd2; feed right away in case there is room now */
        grp->fd2 = limit;
        aio_grp_feed (grp);
1677
void
feed (aio_req grp, SV *callback=&PL_sv_undef)
        CODE:
        {
          /* the feeder callback is kept in fh2 */
          SvREFCNT_dec (grp->fh2);
          grp->fh2 = newSVsv (callback);

          /* no usable limit set yet: default to 2 */
          if (!(grp->fd2 > 0))
            grp->fd2 = 2;

          aio_grp_feed (grp);
        }
1690