/cvs/IO-AIO/AIO.xs
Revision: 1.83
Committed: Sat Oct 28 00:17:30 2006 UTC (17 years, 6 months ago) by root
Branch: MAIN
Changes since 1.82: +4 -1 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 /* solaris */
2 #define _POSIX_PTHREAD_SEMANTICS 1
3
4 #if __linux && !defined(_GNU_SOURCE)
5 # define _GNU_SOURCE
6 #endif
7
8 /* just in case */
9 #define _REENTRANT 1
10
11 #include <errno.h>
12
13 #include "EXTERN.h"
14 #include "perl.h"
15 #include "XSUB.h"
16
17 #include "autoconf/config.h"
18
19 #include <pthread.h>
20
21 #include <stddef.h>
22 #include <errno.h>
23 #include <sys/time.h>
24 #include <sys/select.h>
25 #include <sys/types.h>
26 #include <sys/stat.h>
27 #include <limits.h>
28 #include <unistd.h>
29 #include <fcntl.h>
30 #include <signal.h>
31 #include <sched.h>
32
33 #if HAVE_SENDFILE
34 # if __linux
35 # include <sys/sendfile.h>
36 # elif __freebsd
37 # include <sys/socket.h>
38 # include <sys/uio.h>
39 # elif __hpux
40 # include <sys/socket.h>
41 # elif __solaris /* not yet */
42 # include <sys/sendfile.h>
43 # else
44 # error sendfile support requested but not available
45 # endif
46 #endif
47
48 /* NAME_MAX is used to size struct dirent buffers; AIX doesn't provide it */
49 #ifndef NAME_MAX
50 # define NAME_MAX 4096
51 #endif
52
53 #ifndef PTHREAD_STACK_MIN
54 /* care for broken platforms, e.g. windows */
55 # define PTHREAD_STACK_MIN 16384
56 #endif
57
58 #if __ia64
59 # define STACKSIZE 65536
60 #elif __i386 || __x86_64 /* 16k is unreasonably high :( */
61 # define STACKSIZE PTHREAD_STACK_MIN
62 #else
63 # define STACKSIZE 16384
64 #endif
65
66 /* whether word reads are potentially non-atomic.
67 * this is conservative; most arches this runs
68 * on likely have atomic word reads/writes.
69 */
70 #ifndef WORDREAD_UNSAFE
71 # if __i386 || __x86_64
72 # define WORDREAD_UNSAFE 0
73 # else
74 # define WORDREAD_UNSAFE 1
75 # endif
76 #endif
77
78 /* buffer size for various temporary buffers */
79 #define AIO_BUFSIZE 65536
80
81 #define dBUF \
82 char *aio_buf; \
83 LOCK (wrklock); \
84 self->dbuf = aio_buf = malloc (AIO_BUFSIZE); \
85 UNLOCK (wrklock); \
86 if (!aio_buf) \
87 return -1;
88
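/*
 * How dBUF is used (illustrative sketch only; "emulate_something" is not a
 * function in this file): a worker helper that needs scratch space puts dBUF
 * at the top of its body, which declares aio_buf, allocates AIO_BUFSIZE
 * bytes, records the pointer in self->dbuf under wrklock and bails out with
 * -1 if the allocation fails. worker_clear () frees the buffer afterwards.
 *
 *   static ssize_t emulate_something (int fd, worker *self)
 *   {
 *     dBUF;            // char *aio_buf, malloc'ed, tracked in self->dbuf
 *     // ... use aio_buf as temporary storage ...
 *     return 0;        // buffer is released later via worker_clear (self)
 *   }
 */
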
89 enum {
90 REQ_QUIT,
91 REQ_OPEN, REQ_CLOSE,
92 REQ_READ, REQ_WRITE, REQ_READAHEAD,
93 REQ_SENDFILE,
94 REQ_STAT, REQ_LSTAT, REQ_FSTAT,
95 REQ_FSYNC, REQ_FDATASYNC,
96 REQ_UNLINK, REQ_RMDIR, REQ_RENAME,
97 REQ_MKNOD, REQ_READDIR,
98 REQ_LINK, REQ_SYMLINK,
99 REQ_GROUP, REQ_NOP,
100 REQ_BUSY,
101 };
102
103 #define AIO_REQ_KLASS "IO::AIO::REQ"
104 #define AIO_GRP_KLASS "IO::AIO::GRP"
105
106 typedef struct aio_cb
107 {
108 struct aio_cb *volatile next;
109
110 SV *data, *callback;
111 SV *fh, *fh2;
112 void *dataptr, *data2ptr;
113 Stat_t *statdata;
114 off_t offset;
115 size_t length;
116 ssize_t result;
117
118 STRLEN dataoffset;
119 int type;
120 int fd, fd2;
121 int errorno;
122 mode_t mode; /* open */
123
124 unsigned char flags;
125 unsigned char pri;
126
127 SV *self; /* the perl counterpart of this request, if any */
128 struct aio_cb *grp, *grp_prev, *grp_next, *grp_first;
129 } aio_cb;
130
131 enum {
132 FLAG_CANCELLED = 0x01,
133 };
134
135 typedef aio_cb *aio_req;
136 typedef aio_cb *aio_req_ornot;
137
138 enum {
139 PRI_MIN = -4,
140 PRI_MAX = 4,
141
142 DEFAULT_PRI = 0,
143 PRI_BIAS = -PRI_MIN,
144 NUM_PRI = PRI_MAX + PRI_BIAS + 1,
145 };
146
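/*
 * The Perl-visible priority range PRI_MIN..PRI_MAX (-4..4) is shifted by
 * PRI_BIAS (4) into the array indices 0..NUM_PRI-1 used by the request
 * queues: -4 maps to slot 0, the default 0 to slot 4, +4 to slot 8.
 * next_pri holds the already-biased priority for the next request queued.
 */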
147 static int next_pri = DEFAULT_PRI + PRI_BIAS;
148
149 static unsigned int started, wanted;
150
151 #if __linux && defined (PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP)
152 # define AIO_MUTEX_INIT PTHREAD_ADAPTIVE_MUTEX_INITIALIZER_NP
153 #else
154 # define AIO_MUTEX_INIT PTHREAD_MUTEX_INITIALIZER
155 #endif
156
157 #define LOCK(mutex) pthread_mutex_lock (&(mutex))
158 #define UNLOCK(mutex) pthread_mutex_unlock (&(mutex))
159
160 /* worker threads management */
161 static pthread_mutex_t wrklock = AIO_MUTEX_INIT;
162
163 typedef struct worker {
164 /* locked by wrklock */
165 struct worker *prev, *next;
166
167 pthread_t tid;
168
169 /* locked by reslock, reqlock or wrklock */
170 aio_req req; /* currently processed request */
171 void *dbuf;
172 DIR *dirp;
173 } worker;
174
175 static worker wrk_first = { &wrk_first, &wrk_first, 0 };
176
177 static void worker_clear (worker *wrk)
178 {
179 if (wrk->dirp)
180 {
181 closedir (wrk->dirp);
182 wrk->dirp = 0;
183 }
184
185 if (wrk->dbuf)
186 {
187 free (wrk->dbuf);
188 wrk->dbuf = 0;
189 }
190 }
191
192 static void worker_free (worker *wrk)
193 {
194 wrk->next->prev = wrk->prev;
195 wrk->prev->next = wrk->next;
196
197 free (wrk);
198 }
199
200 static volatile unsigned int nreqs, nready, npending;
201 static volatile unsigned int max_outstanding = 0xffffffff;
202 static int respipe [2];
203
204 static pthread_mutex_t reslock = AIO_MUTEX_INIT;
205 static pthread_mutex_t reqlock = AIO_MUTEX_INIT;
206 static pthread_cond_t reqwait = PTHREAD_COND_INITIALIZER;
207
208 #if WORDREAD_UNSAFE
209
210 static unsigned int get_nready ()
211 {
212 unsigned int retval;
213
214 LOCK (reqlock);
215 retval = nready;
216 UNLOCK (reqlock);
217
218 return retval;
219 }
220
221 static unsigned int get_npending ()
222 {
223 unsigned int retval;
224
225 LOCK (reslock);
226 retval = npending;
227 UNLOCK (reslock);
228
229 return retval;
230 }
231
232 #else
233
234 # define get_nready() nready
235 # define get_npending() npending
236
237 #endif
238
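/*
 * nready and npending are updated under reqlock/reslock but polled from the
 * main thread without them: where a plain word read might tear
 * (WORDREAD_UNSAFE), get_nready/get_npending take the corresponding lock
 * first; on i386/x86_64 they collapse to the bare variables.
 */
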
239 /*
240 * a somewhat faster data structure might be nice, but
241 * with 8 priorities this actually needs <20 insns
242 * per shift, the most expensive operation.
243 */
244 typedef struct {
245 aio_req qs[NUM_PRI], qe[NUM_PRI]; /* qstart, qend */
246 int size;
247 } reqq;
248
249 static reqq req_queue;
250 static reqq res_queue;
251
252 int reqq_push (reqq *q, aio_req req)
253 {
254 int pri = req->pri;
255 req->next = 0;
256
257 if (q->qe[pri])
258 {
259 q->qe[pri]->next = req;
260 q->qe[pri] = req;
261 }
262 else
263 q->qe[pri] = q->qs[pri] = req;
264
265 return q->size++;
266 }
267
268 aio_req reqq_shift (reqq *q)
269 {
270 int pri;
271
272 if (!q->size)
273 return 0;
274
275 --q->size;
276
277 for (pri = NUM_PRI; pri--; )
278 {
279 aio_req req = q->qs[pri];
280
281 if (req)
282 {
283 if (!(q->qs[pri] = req->next))
284 q->qe[pri] = 0;
285
286 return req;
287 }
288 }
289
290 abort ();
291 }
292
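/*
 * reqq is one singly-linked FIFO per priority slot: reqq_push appends at
 * qe[pri] and returns the size *before* the push, so a return value of 0
 * tells the caller the queue was empty (which is what triggers the wakeup
 * byte on the result pipe in aio_proc). reqq_shift scans from the highest
 * slot downwards and therefore always returns the highest-priority request.
 */
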
293 static int poll_cb (int max);
294 static void req_invoke (aio_req req);
295 static void req_free (aio_req req);
296 static void req_cancel (aio_req req);
297
298 /* must be called at most once */
299 static SV *req_sv (aio_req req, const char *klass)
300 {
301 if (!req->self)
302 {
303 req->self = (SV *)newHV ();
304 sv_magic (req->self, 0, PERL_MAGIC_ext, (char *)req, 0);
305 }
306
307 return sv_2mortal (sv_bless (newRV_inc (req->self), gv_stashpv (klass, 1)));
308 }
309
310 static aio_req SvAIO_REQ (SV *sv)
311 {
312 MAGIC *mg;
313
314 if (!sv_derived_from (sv, AIO_REQ_KLASS) || !SvROK (sv))
315 croak ("object of class " AIO_REQ_KLASS " expected");
316
317 mg = mg_find (SvRV (sv), PERL_MAGIC_ext);
318
319 return mg ? (aio_req)mg->mg_ptr : 0;
320 }
321
322 static void aio_grp_feed (aio_req grp)
323 {
324 while (grp->length < grp->fd2 && !(grp->flags & FLAG_CANCELLED))
325 {
326 int old_len = grp->length;
327
328 if (grp->fh2 && SvOK (grp->fh2))
329 {
330 dSP;
331
332 ENTER;
333 SAVETMPS;
334 PUSHMARK (SP);
335 XPUSHs (req_sv (grp, AIO_GRP_KLASS));
336 PUTBACK;
337 call_sv (grp->fh2, G_VOID | G_EVAL | G_KEEPERR);
338 SPAGAIN;
339 FREETMPS;
340 LEAVE;
341 }
342
343 /* stop if no progress has been made */
344 if (old_len == grp->length)
345 {
346 SvREFCNT_dec (grp->fh2);
347 grp->fh2 = 0;
348 break;
349 }
350 }
351 }
352
353 static void aio_grp_dec (aio_req grp)
354 {
355 --grp->length;
356
357 /* call feeder, if applicable */
358 aio_grp_feed (grp);
359
360 /* finish, if done */
361 if (!grp->length && grp->fd)
362 {
363 req_invoke (grp);
364 req_free (grp);
365 }
366 }
367
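/*
 * REQ_GROUP requests reuse several generic fields: length counts the
 * outstanding subrequests, fd holds the group state (0 running, 1 delayed
 * in poll_cb, 2 finished), fd2 is the feeder limit and fh2 the Perl feeder
 * callback. aio_grp_feed above runs the feeder until the limit is reached
 * or it stops adding requests; aio_grp_dec finishes the group once the
 * last subrequest is gone.
 */
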
368 static void req_invoke (aio_req req)
369 {
370 dSP;
371
372 if (!(req->flags & FLAG_CANCELLED) && SvOK (req->callback))
373 {
374 ENTER;
375 SAVETMPS;
376 PUSHMARK (SP);
377 EXTEND (SP, 1);
378
379 switch (req->type)
380 {
381 case REQ_READDIR:
382 {
383 SV *rv = &PL_sv_undef;
384
385 if (req->result >= 0)
386 {
387 int i;
388 char *buf = req->data2ptr;
389 AV *av = newAV ();
390
391 av_extend (av, req->result - 1);
392
393 for (i = 0; i < req->result; ++i)
394 {
395 SV *sv = newSVpv (buf, 0);
396
397 av_store (av, i, sv);
398 buf += SvCUR (sv) + 1;
399 }
400
401 rv = sv_2mortal (newRV_noinc ((SV *)av));
402 }
403
404 PUSHs (rv);
405 }
406 break;
407
408 case REQ_OPEN:
409 {
410 /* convert fd to fh */
411 SV *fh;
412
413 PUSHs (sv_2mortal (newSViv (req->result)));
414 PUTBACK;
415 call_pv ("IO::AIO::_fd2fh", G_SCALAR | G_EVAL);
416 SPAGAIN;
417
418 fh = SvREFCNT_inc (POPs);
419
420 PUSHMARK (SP);
421 XPUSHs (sv_2mortal (fh));
422 }
423 break;
424
425 case REQ_GROUP:
426 req->fd = 2; /* mark group as finished */
427
428 if (req->data)
429 {
430 int i;
431 AV *av = (AV *)req->data;
432
433 EXTEND (SP, AvFILL (av) + 1);
434 for (i = 0; i <= AvFILL (av); ++i)
435 PUSHs (*av_fetch (av, i, 0));
436 }
437 break;
438
439 case REQ_NOP:
440 case REQ_BUSY:
441 break;
442
443 default:
444 PUSHs (sv_2mortal (newSViv (req->result)));
445 break;
446 }
447
448 errno = req->errorno;
449
450 PUTBACK;
451 call_sv (req->callback, G_VOID | G_EVAL);
452 SPAGAIN;
453
454 FREETMPS;
455 LEAVE;
456 }
457
458 if (req->grp)
459 {
460 aio_req grp = req->grp;
461
462 /* unlink request */
463 if (req->grp_next) req->grp_next->grp_prev = req->grp_prev;
464 if (req->grp_prev) req->grp_prev->grp_next = req->grp_next;
465
466 if (grp->grp_first == req)
467 grp->grp_first = req->grp_next;
468
469 aio_grp_dec (grp);
470 }
471
472 if (SvTRUE (ERRSV))
473 {
474 req_free (req);
475 croak (0);
476 }
477 }
478
479 static void req_free (aio_req req)
480 {
481 if (req->self)
482 {
483 sv_unmagic (req->self, PERL_MAGIC_ext);
484 SvREFCNT_dec (req->self);
485 }
486
487 SvREFCNT_dec (req->data);
488 SvREFCNT_dec (req->fh);
489 SvREFCNT_dec (req->fh2);
490 SvREFCNT_dec (req->callback);
491 Safefree (req->statdata);
492
493 if (req->type == REQ_READDIR)
494 free (req->data2ptr);
495
496 Safefree (req);
497 }
498
499 static void req_cancel_subs (aio_req grp)
500 {
501 aio_req sub;
502
503 if (grp->type != REQ_GROUP)
504 return;
505
506 SvREFCNT_dec (grp->fh2);
507 grp->fh2 = 0;
508
509 for (sub = grp->grp_first; sub; sub = sub->grp_next)
510 req_cancel (sub);
511 }
512
513 static void req_cancel (aio_req req)
514 {
515 req->flags |= FLAG_CANCELLED;
516
517 req_cancel_subs (req);
518 }
519
520 static void *aio_proc(void *arg);
521
522 static void start_thread (void)
523 {
524 sigset_t fullsigset, oldsigset;
525 pthread_attr_t attr;
526
527 worker *wrk = calloc (1, sizeof (worker));
528
529 if (!wrk)
530 croak ("unable to allocate worker thread data");
531
532 pthread_attr_init (&attr);
533 pthread_attr_setstacksize (&attr, STACKSIZE);
534 pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
535 #ifdef PTHREAD_SCOPE_PROCESS
536 pthread_attr_setscope (&attr, PTHREAD_SCOPE_PROCESS);
537 #endif
538
539 sigfillset (&fullsigset);
540
541 LOCK (wrklock);
542 sigprocmask (SIG_SETMASK, &fullsigset, &oldsigset);
543
544 if (pthread_create (&wrk->tid, &attr, aio_proc, (void *)wrk) == 0)
545 {
546 wrk->prev = &wrk_first;
547 wrk->next = wrk_first.next;
548 wrk_first.next->prev = wrk;
549 wrk_first.next = wrk;
550 ++started;
551 }
552 else
553 free (wrk);
554
555 sigprocmask (SIG_SETMASK, &oldsigset, 0);
556 UNLOCK (wrklock);
557 }
558
559 static void maybe_start_thread ()
560 {
561 #if 0
562 static struct timeval last;
563 struct timeval diff, now;
564 #endif
565
566 if (started >= wanted)
567 return;
568
569 if (nready <= nreqs - get_nready () - get_npending ())
570 return;
571
572 #if 0
573 gettimeofday (&now, 0);
574
575 diff.tv_sec = now.tv_sec - last.tv_sec;
576 diff.tv_usec = now.tv_usec - last.tv_usec;
577
578 if (diff.tv_usec < 0)
579 {
580 --diff.tv_sec;
581 diff.tv_usec += 1000000;
582 }
583
584 if (!diff.tv_sec && diff.tv_usec < 10000)
585 return;
586
587 last = now;
588 #endif
589
590 start_thread ();
591 }
592
593 static void req_send (aio_req req)
594 {
595 ++nreqs;
596
597 LOCK (reqlock);
598 ++nready;
599 reqq_push (&req_queue, req);
600 pthread_cond_signal (&reqwait);
601 UNLOCK (reqlock);
602
603 maybe_start_thread ();
604 }
605
606 static void end_thread (void)
607 {
608 aio_req req;
609
610 Newz (0, req, 1, aio_cb);
611
612 req->type = REQ_QUIT;
613 req->pri = PRI_MAX + PRI_BIAS;
614
615 LOCK (reqlock);
616 reqq_push (&req_queue, req);
617 pthread_cond_signal (&reqwait);
618 UNLOCK (reqlock);
619
620 LOCK (wrklock);
621 --started;
622 UNLOCK (wrklock);
623 }
624
625 static void min_parallel (int nthreads)
626 {
627 if (wanted < nthreads)
628 wanted = nthreads;
629 }
630
631 static void max_parallel (int nthreads)
632 {
633 if (wanted > nthreads)
634 wanted = nthreads;
635
636 while (started > wanted)
637 end_thread ();
638 }
639
640 static void poll_wait ()
641 {
642 fd_set rfd;
643
644 while (nreqs)
645 {
646 int size;
647 if (WORDREAD_UNSAFE) LOCK (reslock);
648 size = res_queue.size;
649 if (WORDREAD_UNSAFE) UNLOCK (reslock);
650
651 if (size)
652 return;
653
654 maybe_start_thread ();
655
656 FD_ZERO(&rfd);
657 FD_SET(respipe [0], &rfd);
658
659 select (respipe [0] + 1, &rfd, 0, 0, 0);
660 }
661 }
662
663 static int poll_cb (int max)
664 {
665 dSP;
666 int count = 0;
667 int do_croak = 0;
668 aio_req req;
669
670 for (;;)
671 {
672 while (max <= 0 || count < max)
673 {
674 maybe_start_thread ();
675
676 LOCK (reslock);
677 req = reqq_shift (&res_queue);
678
679 if (req)
680 {
681 --npending;
682
683 if (!res_queue.size)
684 {
685 /* read any signals sent by the worker threads */
686 char buf [32];
687 while (read (respipe [0], buf, 32) == 32)
688 ;
689 }
690 }
691
692 UNLOCK (reslock);
693
694 if (!req)
695 break;
696
697 --nreqs;
698
699 if (req->type == REQ_GROUP && req->length)
700 {
701 req->fd = 1; /* mark request as delayed */
702 continue;
703 }
704 else
705 {
706 if (req->type == REQ_READ)
707 SvCUR_set (req->data, req->dataoffset + (req->result > 0 ? req->result : 0));
708
709 if (req->data2ptr && (req->type == REQ_READ || req->type == REQ_WRITE))
710 SvREADONLY_off (req->data);
711
712 if (req->statdata)
713 {
714 PL_laststype = req->type == REQ_LSTAT ? OP_LSTAT : OP_STAT;
715 PL_laststatval = req->result;
716 PL_statcache = *(req->statdata);
717 }
718
719 req_invoke (req);
720
721 count++;
722 }
723
724 req_free (req);
725 }
726
727 if (nreqs <= max_outstanding)
728 break;
729
730 poll_wait ();
731
732 max = 0;
733 }
734
735 return count;
736 }
737
738 static void create_pipe ()
739 {
740 if (pipe (respipe))
741 croak ("unable to initialize result pipe");
742
743 if (fcntl (respipe [0], F_SETFL, O_NONBLOCK))
744 croak ("cannot set result pipe to nonblocking mode");
745
746 if (fcntl (respipe [1], F_SETFL, O_NONBLOCK))
747 croak ("cannot set result pipe to nonblocking mode");
748 }
749
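/*
 * respipe is the wakeup channel between the worker threads and the main
 * thread: a worker writes one dummy byte when it pushes onto an empty
 * result queue (see aio_proc below), poll_wait above selects on respipe [0]
 * until that happens, and poll_cb drains the pipe once it has emptied the
 * result queue. The Perl-level poll_fileno simply returns respipe [0] so an
 * external event loop can watch it instead of blocking in poll_wait.
 */
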
750 /*****************************************************************************/
751 /* work around various missing functions */
752
753 #if !HAVE_PREADWRITE
754 # define pread aio_pread
755 # define pwrite aio_pwrite
756
757 /*
758 * make our pread/pwrite safe against themselves, but not against
759 * normal read/write by using a mutex. slows down execution a lot,
760 * but that's your problem, not mine.
761 */
762 static pthread_mutex_t preadwritelock = PTHREAD_MUTEX_INITIALIZER;
763
764 static ssize_t pread (int fd, void *buf, size_t count, off_t offset)
765 {
766 ssize_t res;
767 off_t ooffset;
768
769 LOCK (preadwritelock);
770 ooffset = lseek (fd, 0, SEEK_CUR);
771 lseek (fd, offset, SEEK_SET);
772 res = read (fd, buf, count);
773 lseek (fd, ooffset, SEEK_SET);
774 UNLOCK (preadwritelock);
775
776 return res;
777 }
778
779 static ssize_t pwrite (int fd, void *buf, size_t count, off_t offset)
780 {
781 ssize_t res;
782 off_t ooffset;
783
784 LOCK (preadwritelock);
785 ooffset = lseek (fd, 0, SEEK_CUR);
786 lseek (fd, offset, SEEK_SET);
787 res = write (fd, buf, count);
788 lseek (fd, ooffset, SEEK_SET); /* restore the original offset, as in pread above */
789 UNLOCK (preadwritelock);
790
791 return res;
792 }
793 #endif
794
795 #if !HAVE_FDATASYNC
796 # define fdatasync fsync
797 #endif
798
799 #if !HAVE_READAHEAD
800 # define readahead(fd,offset,count) aio_readahead (fd, offset, count, self)
801
802 static ssize_t aio_readahead (int fd, off_t offset, size_t count, worker *self)
803 {
804 dBUF;
805
806 while (count > 0)
807 {
808 size_t len = count < AIO_BUFSIZE ? count : AIO_BUFSIZE;
809
810 pread (fd, aio_buf, len, offset);
811 offset += len;
812 count -= len;
813 }
814
815 errno = 0; return 0; /* the emulated readahead has no meaningful return value */
816 }
817
818 #endif
819
820 #if !HAVE_READDIR_R
821 # define readdir_r aio_readdir_r
822
823 static pthread_mutex_t readdirlock = PTHREAD_MUTEX_INITIALIZER;
824
825 static int readdir_r (DIR *dirp, struct dirent *ent, struct dirent **res)
826 {
827 struct dirent *e;
828 int errorno;
829
830 LOCK (readdirlock);
831
832 e = readdir (dirp);
833 errorno = errno;
834
835 if (e)
836 {
837 *res = ent;
838 strcpy (ent->d_name, e->d_name);
839 }
840 else
841 *res = 0;
842
843 UNLOCK (readdirlock);
844
845 errno = errorno;
846 return e ? 0 : -1;
847 }
848 #endif
849
850 /* sendfile always needs emulation */
851 static ssize_t sendfile_ (int ofd, int ifd, off_t offset, size_t count, worker *self)
852 {
853 ssize_t res;
854
855 if (!count)
856 return 0;
857
858 #if HAVE_SENDFILE
859 # if __linux
860 res = sendfile (ofd, ifd, &offset, count);
861
862 # elif __freebsd
863 /*
864 * Of course, the freebsd sendfile is a dire hack with no thoughts
865 * wasted on making it similar to other I/O functions.
866 */
867 {
868 off_t sbytes;
869 res = sendfile (ifd, ofd, offset, count, 0, &sbytes, 0);
870
871 if (res < 0 && sbytes)
872 /* maybe only on EAGAIN: as usual, the manpage leaves you guessing */
873 res = sbytes;
874 }
875
876 # elif __hpux
877 res = sendfile (ofd, ifd, offset, count, 0, 0);
878
879 # elif __solaris
880 {
881 struct sendfilevec vec;
882 size_t sbytes;
883
884 vec.sfv_fd = ifd;
885 vec.sfv_flag = 0;
886 vec.sfv_off = offset;
887 vec.sfv_len = count;
888
889 res = sendfilev (ofd, &vec, 1, &sbytes);
890
891 if (res < 0 && sbytes)
892 res = sbytes;
893 }
894
895 # endif
896 #else
897 res = -1;
898 errno = ENOSYS;
899 #endif
900
901 if (res < 0
902 && (errno == ENOSYS || errno == EINVAL || errno == ENOTSOCK
903 #if __solaris
904 || errno == EAFNOSUPPORT || errno == EPROTOTYPE
905 #endif
906 )
907 )
908 {
909 /* emulate sendfile. this is a major pain in the ass */
910 dBUF;
911
912 res = 0;
913
914 while (count)
915 {
916 ssize_t cnt;
917
918 cnt = pread (ifd, aio_buf, count > AIO_BUFSIZE ? AIO_BUFSIZE : count, offset);
919
920 if (cnt <= 0)
921 {
922 if (cnt && !res) res = -1;
923 break;
924 }
925
926 cnt = write (ofd, aio_buf, cnt);
927
928 if (cnt <= 0)
929 {
930 if (cnt && !res) res = -1;
931 break;
932 }
933
934 offset += cnt;
935 res += cnt;
936 count -= cnt;
937 }
938 }
939
940 return res;
941 }
942
943 /* read a full directory */
944 static void scandir_ (aio_req req, worker *self)
945 {
946 DIR *dirp;
947 union
948 {
949 struct dirent d;
950 char b [offsetof (struct dirent, d_name) + NAME_MAX + 1];
951 } *u;
952 struct dirent *entp;
953 char *name, *names;
954 int memlen = 4096;
955 int memofs = 0;
956 int res = 0;
957 int errorno;
958
959 LOCK (wrklock);
960 self->dirp = dirp = opendir (req->dataptr);
961 self->dbuf = u = malloc (sizeof (*u));
962 req->data2ptr = names = malloc (memlen);
963 UNLOCK (wrklock);
964
965 if (dirp && u && names)
966 for (;;)
967 {
968 errno = 0;
969 readdir_r (dirp, &u->d, &entp);
970
971 if (!entp)
972 break;
973
974 name = entp->d_name;
975
976 if (name [0] != '.' || (name [1] && (name [1] != '.' || name [2])))
977 {
978 int len = strlen (name) + 1;
979
980 res++;
981
982 while (memofs + len > memlen)
983 {
984 memlen *= 2;
985 LOCK (wrklock);
986 req->data2ptr = names = realloc (names, memlen);
987 UNLOCK (wrklock);
988
989 if (!names)
990 break;
991 }
992
993 memcpy (names + memofs, name, len);
994 memofs += len;
995 }
996 }
997
998 if (errno)
999 res = -1;
1000
1001 req->result = res;
1002 }
1003
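/*
 * scandir_ hands its result back in two pieces: req->result is the number
 * of entries found ("." and ".." excluded, -1 on error) and req->data2ptr
 * is a malloc'ed buffer holding that many NUL-terminated names back to
 * back. The REQ_READDIR branch of req_invoke above unpacks the buffer into
 * the array reference passed to the Perl callback; req_free releases it.
 */
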
1004 /*****************************************************************************/
1005
1006 static void *aio_proc (void *thr_arg)
1007 {
1008 aio_req req;
1009 worker *self = (worker *)thr_arg;
1010
1011 for (;;)
1012 {
1013 LOCK (reqlock);
1014
1015 for (;;)
1016 {
1017 self->req = req = reqq_shift (&req_queue);
1018
1019 if (req)
1020 break;
1021
1022 pthread_cond_wait (&reqwait, &reqlock);
1023 }
1024
1025 --nready;
1026
1027 UNLOCK (reqlock);
1028
1029 errno = 0; /* strictly unnecessary */
1030
1031 if (!(req->flags & FLAG_CANCELLED))
1032 switch (req->type)
1033 {
1034 case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break;
1035 case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break;
1036
1037 case REQ_READAHEAD: req->result = readahead (req->fd, req->offset, req->length); break;
1038 case REQ_SENDFILE: req->result = sendfile_ (req->fd, req->fd2, req->offset, req->length, self); break;
1039
1040 case REQ_STAT: req->result = stat (req->dataptr, req->statdata); break;
1041 case REQ_LSTAT: req->result = lstat (req->dataptr, req->statdata); break;
1042 case REQ_FSTAT: req->result = fstat (req->fd , req->statdata); break;
1043
1044 case REQ_OPEN: req->result = open (req->dataptr, req->fd, req->mode); break;
1045 case REQ_CLOSE: req->result = close (req->fd); break;
1046 case REQ_UNLINK: req->result = unlink (req->dataptr); break;
1047 case REQ_RMDIR: req->result = rmdir (req->dataptr); break;
1048 case REQ_RENAME: req->result = rename (req->data2ptr, req->dataptr); break;
1049 case REQ_LINK: req->result = link (req->data2ptr, req->dataptr); break;
1050 case REQ_SYMLINK: req->result = symlink (req->data2ptr, req->dataptr); break;
1051 case REQ_MKNOD: req->result = mknod (req->data2ptr, req->mode, (dev_t)req->offset); break;
1052
1053 case REQ_FDATASYNC: req->result = fdatasync (req->fd); break;
1054 case REQ_FSYNC: req->result = fsync (req->fd); break;
1055 case REQ_READDIR: scandir_ (req, self); break;
1056
1057 case REQ_BUSY:
1058 {
1059 struct timeval tv;
1060
1061 tv.tv_sec = req->fd;
1062 tv.tv_usec = req->fd2;
1063
1064 req->result = select (0, 0, 0, 0, &tv);
1065 }
1066
1067 case REQ_GROUP:
1068 case REQ_NOP:
1069 break;
1070
1071 case REQ_QUIT:
1072 LOCK (wrklock);
1073 worker_free (self);
1074 --started;
1075 UNLOCK (wrklock);
1076 return 0;
1077
1078 default:
1079 req->result = ENOSYS;
1080 break;
1081 }
1082
1083 req->errorno = errno;
1084
1085 LOCK (reslock);
1086
1087 ++npending;
1088
1089 if (!reqq_push (&res_queue, req))
1090 /* write a dummy byte to the pipe so fh becomes ready */
1091 write (respipe [1], &respipe, 1);
1092
1093 self->req = 0;
1094 worker_clear (self);
1095
1096 UNLOCK (reslock);
1097 }
1098 }
1099
1100 /*****************************************************************************/
1101
1102 static void atfork_prepare (void)
1103 {
1104 LOCK (wrklock);
1105 LOCK (reqlock);
1106 LOCK (reslock);
1107 #if !HAVE_PREADWRITE
1108 LOCK (preadwritelock);
1109 #endif
1110 #if !HAVE_READDIR_R
1111 LOCK (readdirlock);
1112 #endif
1113 }
1114
1115 static void atfork_parent (void)
1116 {
1117 #if !HAVE_READDIR_R
1118 UNLOCK (readdirlock);
1119 #endif
1120 #if !HAVE_PREADWRITE
1121 UNLOCK (preadwritelock);
1122 #endif
1123 UNLOCK (reslock);
1124 UNLOCK (reqlock);
1125 UNLOCK (wrklock);
1126 }
1127
1128 static void atfork_child (void)
1129 {
1130 aio_req prv;
1131
1132 while (prv = reqq_shift (&req_queue))
1133 req_free (prv);
1134
1135 while (prv = reqq_shift (&res_queue))
1136 req_free (prv);
1137
1138 while (wrk_first.next != &wrk_first)
1139 {
1140 worker *wrk = wrk_first.next;
1141
1142 if (wrk->req)
1143 req_free (wrk->req);
1144
1145 worker_clear (wrk);
1146 worker_free (wrk);
1147 }
1148
1149 started = 0;
1150 nreqs = 0;
1151
1152 close (respipe [0]);
1153 close (respipe [1]);
1154 create_pipe ();
1155
1156 atfork_parent ();
1157 }
1158
1159 #define dREQ \
1160 aio_req req; \
1161 int req_pri = next_pri; \
1162 next_pri = DEFAULT_PRI + PRI_BIAS; \
1163 \
1164 if (SvOK (callback) && !SvROK (callback)) \
1165 croak ("callback must be undef or of reference type"); \
1166 \
1167 Newz (0, req, 1, aio_cb); \
1168 if (!req) \
1169 croak ("out of memory during aio_req allocation"); \
1170 \
1171 req->callback = newSVsv (callback); \
1172 req->pri = req_pri
1173
1174 #define REQ_SEND \
1175 req_send (req); \
1176 \
1177 if (GIMME_V != G_VOID) \
1178 XPUSHs (req_sv (req, AIO_REQ_KLASS));
1179
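/*
 * The aio_* XSUBs below follow the same pattern: dREQ allocates and zeroes
 * an aio_cb, captures the callback SV and the current one-shot priority
 * from next_pri, the XSUB body then fills in the type-specific fields, and
 * REQ_SEND queues the request and, unless called in void context, pushes
 * an IO::AIO::REQ object. Roughly (illustrative only, not an XSUB taken
 * from this file):
 *
 *   {
 *     dREQ;                      // req, req->callback, req->pri set up
 *     req->type = REQ_SOMETHING; // plus whatever fields the type needs
 *     REQ_SEND;                  // enqueue; maybe push a request object
 *   }
 */
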
1180 MODULE = IO::AIO PACKAGE = IO::AIO
1181
1182 PROTOTYPES: ENABLE
1183
1184 BOOT:
1185 {
1186 HV *stash = gv_stashpv ("IO::AIO", 1);
1187
1188 newCONSTSUB (stash, "EXDEV", newSViv (EXDEV));
1189 newCONSTSUB (stash, "O_RDONLY", newSViv (O_RDONLY));
1190 newCONSTSUB (stash, "O_WRONLY", newSViv (O_WRONLY));
1191 newCONSTSUB (stash, "O_CREAT", newSViv (O_CREAT));
1192 newCONSTSUB (stash, "O_TRUNC", newSViv (O_TRUNC));
1193 newCONSTSUB (stash, "S_IFIFO", newSViv (S_IFIFO));
1194
1195 create_pipe ();
1196 pthread_atfork (atfork_prepare, atfork_parent, atfork_child);
1197
1198 start_thread ();
1199 }
1200
1201 void
1202 min_parallel (int nthreads)
1203 PROTOTYPE: $
1204
1205 void
1206 max_parallel (int nthreads)
1207 PROTOTYPE: $
1208
1209 int
1210 max_outstanding (int maxreqs)
1211 PROTOTYPE: $
1212 CODE:
1213 RETVAL = max_outstanding;
1214 max_outstanding = maxreqs;
1215 OUTPUT:
1216 RETVAL
1217
1218 void
1219 aio_open (pathname,flags,mode,callback=&PL_sv_undef)
1220 SV * pathname
1221 int flags
1222 int mode
1223 SV * callback
1224 PROTOTYPE: $$$;$
1225 PPCODE:
1226 {
1227 dREQ;
1228
1229 req->type = REQ_OPEN;
1230 req->data = newSVsv (pathname);
1231 req->dataptr = SvPVbyte_nolen (req->data);
1232 req->fd = flags;
1233 req->mode = mode;
1234
1235 REQ_SEND;
1236 }
1237
1238 void
1239 aio_close (fh,callback=&PL_sv_undef)
1240 SV * fh
1241 SV * callback
1242 PROTOTYPE: $;$
1243 ALIAS:
1244 aio_close = REQ_CLOSE
1245 aio_fsync = REQ_FSYNC
1246 aio_fdatasync = REQ_FDATASYNC
1247 PPCODE:
1248 {
1249 dREQ;
1250
1251 req->type = ix;
1252 req->fh = newSVsv (fh);
1253 req->fd = PerlIO_fileno (IoIFP (sv_2io (fh)));
1254
1255 REQ_SEND;
1256 }
1257
1258 void
1259 aio_read (fh,offset,length,data,dataoffset,callback=&PL_sv_undef)
1260 SV * fh
1261 UV offset
1262 UV length
1263 SV * data
1264 UV dataoffset
1265 SV * callback
1266 ALIAS:
1267 aio_read = REQ_READ
1268 aio_write = REQ_WRITE
1269 PROTOTYPE: $$$$$;$
1270 PPCODE:
1271 {
1272 aio_req req;
1273 STRLEN svlen;
1274 char *svptr = SvPVbyte (data, svlen);
1275
1276 SvUPGRADE (data, SVt_PV);
1277 SvPOK_on (data);
1278
1279 if (dataoffset < 0)
1280 dataoffset += svlen;
1281
1282 if (dataoffset < 0 || dataoffset > svlen)
1283 croak ("data offset outside of string");
1284
1285 if (ix == REQ_WRITE)
1286 {
1287 /* write: check length and adjust. */
1288 if (length < 0 || length + dataoffset > svlen)
1289 length = svlen - dataoffset;
1290 }
1291 else
1292 {
1293 /* read: grow scalar as necessary */
1294 svptr = SvGROW (data, length + dataoffset);
1295 }
1296
1297 if (length < 0)
1298 croak ("length must not be negative");
1299
1300 {
1301 dREQ;
1302
1303 req->type = ix;
1304 req->fh = newSVsv (fh);
1305 req->fd = PerlIO_fileno (ix == REQ_READ ? IoIFP (sv_2io (fh))
1306 : IoOFP (sv_2io (fh)));
1307 req->offset = offset;
1308 req->length = length;
1309 req->data = SvREFCNT_inc (data);
1310 req->dataptr = (char *)svptr + dataoffset;
1311
1312 if (!SvREADONLY (data))
1313 {
1314 SvREADONLY_on (data);
1315 req->data2ptr = (void *)data;
1316 }
1317
1318 REQ_SEND;
1319 }
1320 }
1321
1322 void
1323 aio_sendfile (out_fh,in_fh,in_offset,length,callback=&PL_sv_undef)
1324 SV * out_fh
1325 SV * in_fh
1326 UV in_offset
1327 UV length
1328 SV * callback
1329 PROTOTYPE: $$$$;$
1330 PPCODE:
1331 {
1332 dREQ;
1333
1334 req->type = REQ_SENDFILE;
1335 req->fh = newSVsv (out_fh);
1336 req->fd = PerlIO_fileno (IoIFP (sv_2io (out_fh)));
1337 req->fh2 = newSVsv (in_fh);
1338 req->fd2 = PerlIO_fileno (IoIFP (sv_2io (in_fh)));
1339 req->offset = in_offset;
1340 req->length = length;
1341
1342 REQ_SEND;
1343 }
1344
1345 void
1346 aio_readahead (fh,offset,length,callback=&PL_sv_undef)
1347 SV * fh
1348 UV offset
1349 IV length
1350 SV * callback
1351 PROTOTYPE: $$$;$
1352 PPCODE:
1353 {
1354 dREQ;
1355
1356 req->type = REQ_READAHEAD;
1357 req->fh = newSVsv (fh);
1358 req->fd = PerlIO_fileno (IoIFP (sv_2io (fh)));
1359 req->offset = offset;
1360 req->length = length;
1361
1362 REQ_SEND;
1363 }
1364
1365 void
1366 aio_stat (fh_or_path,callback=&PL_sv_undef)
1367 SV * fh_or_path
1368 SV * callback
1369 ALIAS:
1370 aio_stat = REQ_STAT
1371 aio_lstat = REQ_LSTAT
1372 PPCODE:
1373 {
1374 dREQ;
1375
1376 New (0, req->statdata, 1, Stat_t);
1377 if (!req->statdata)
1378 {
1379 req_free (req);
1380 croak ("out of memory during aio_req->statdata allocation");
1381 }
1382
1383 if (SvPOK (fh_or_path))
1384 {
1385 req->type = ix;
1386 req->data = newSVsv (fh_or_path);
1387 req->dataptr = SvPVbyte_nolen (req->data);
1388 }
1389 else
1390 {
1391 req->type = REQ_FSTAT;
1392 req->fh = newSVsv (fh_or_path);
1393 req->fd = PerlIO_fileno (IoIFP (sv_2io (fh_or_path)));
1394 }
1395
1396 REQ_SEND;
1397 }
1398
1399 void
1400 aio_unlink (pathname,callback=&PL_sv_undef)
1401 SV * pathname
1402 SV * callback
1403 ALIAS:
1404 aio_unlink = REQ_UNLINK
1405 aio_rmdir = REQ_RMDIR
1406 aio_readdir = REQ_READDIR
1407 PPCODE:
1408 {
1409 dREQ;
1410
1411 req->type = ix;
1412 req->data = newSVsv (pathname);
1413 req->dataptr = SvPVbyte_nolen (req->data);
1414
1415 REQ_SEND;
1416 }
1417
1418 void
1419 aio_link (oldpath,newpath,callback=&PL_sv_undef)
1420 SV * oldpath
1421 SV * newpath
1422 SV * callback
1423 ALIAS:
1424 aio_link = REQ_LINK
1425 aio_symlink = REQ_SYMLINK
1426 aio_rename = REQ_RENAME
1427 PPCODE:
1428 {
1429 dREQ;
1430
1431 req->type = ix;
1432 req->fh = newSVsv (oldpath);
1433 req->data2ptr = SvPVbyte_nolen (req->fh);
1434 req->data = newSVsv (newpath);
1435 req->dataptr = SvPVbyte_nolen (req->data);
1436
1437 REQ_SEND;
1438 }
1439
1440 void
1441 aio_mknod (pathname,mode,dev,callback=&PL_sv_undef)
1442 SV * pathname
1443 SV * callback
1444 UV mode
1445 UV dev
1446 PPCODE:
1447 {
1448 dREQ;
1449
1450 req->type = REQ_MKNOD;
1451 req->data = newSVsv (pathname);
1452 req->dataptr = SvPVbyte_nolen (req->data);
1453 req->mode = (mode_t)mode;
1454 req->offset = dev;
1455
1456 REQ_SEND;
1457 }
1458
1459 void
1460 aio_busy (delay,callback=&PL_sv_undef)
1461 double delay
1462 SV * callback
1463 PPCODE:
1464 {
1465 dREQ;
1466
1467 req->type = REQ_BUSY;
1468 req->fd = delay < 0. ? 0 : delay;
1469 req->fd2 = delay < 0. ? 0 : 1000. * (delay - req->fd);
1470
1471 REQ_SEND;
1472 }
1473
1474 void
1475 aio_group (callback=&PL_sv_undef)
1476 SV * callback
1477 PROTOTYPE: ;$
1478 PPCODE:
1479 {
1480 dREQ;
1481
1482 req->type = REQ_GROUP;
1483 req_send (req);
1484
1485 XPUSHs (req_sv (req, AIO_GRP_KLASS));
1486 }
1487
1488 void
1489 aio_nop (callback=&PL_sv_undef)
1490 SV * callback
1491 PPCODE:
1492 {
1493 dREQ;
1494
1495 req->type = REQ_NOP;
1496
1497 REQ_SEND;
1498 }
1499
1500 int
1501 aioreq_pri (int pri = 0)
1502 PROTOTYPE: ;$
1503 CODE:
1504 RETVAL = next_pri - PRI_BIAS;
1505 if (items > 0)
1506 {
1507 if (pri < PRI_MIN) pri = PRI_MIN;
1508 if (pri > PRI_MAX) pri = PRI_MAX;
1509 next_pri = pri + PRI_BIAS;
1510 }
1511 OUTPUT:
1512 RETVAL
1513
1514 void
1515 aioreq_nice (int nice = 0)
1516 CODE:
1517 nice = next_pri - nice;
1518 if (nice < PRI_MIN) nice = PRI_MIN;
1519 if (nice > PRI_MAX) nice = PRI_MAX;
1520 next_pri = nice + PRI_BIAS;
1521
1522 void
1523 flush ()
1524 PROTOTYPE:
1525 CODE:
1526 while (nreqs)
1527 {
1528 poll_wait ();
1529 poll_cb (0);
1530 }
1531
1532 void
1533 poll()
1534 PROTOTYPE:
1535 CODE:
1536 if (nreqs)
1537 {
1538 poll_wait ();
1539 poll_cb (0);
1540 }
1541
1542 int
1543 poll_fileno()
1544 PROTOTYPE:
1545 CODE:
1546 RETVAL = respipe [0];
1547 OUTPUT:
1548 RETVAL
1549
1550 int
1551 poll_cb(...)
1552 PROTOTYPE:
1553 CODE:
1554 RETVAL = poll_cb (0);
1555 OUTPUT:
1556 RETVAL
1557
1558 int
1559 poll_some(int max = 0)
1560 PROTOTYPE: $
1561 CODE:
1562 RETVAL = poll_cb (max);
1563 OUTPUT:
1564 RETVAL
1565
1566 void
1567 poll_wait()
1568 PROTOTYPE:
1569 CODE:
1570 if (nreqs)
1571 poll_wait ();
1572
1573 int
1574 nreqs()
1575 PROTOTYPE:
1576 CODE:
1577 RETVAL = nreqs;
1578 OUTPUT:
1579 RETVAL
1580
1581 int
1582 nready()
1583 PROTOTYPE:
1584 CODE:
1585 RETVAL = get_nready ();
1586 OUTPUT:
1587 RETVAL
1588
1589 int
1590 npending()
1591 PROTOTYPE:
1592 CODE:
1593 RETVAL = get_npending ();
1594 OUTPUT:
1595 RETVAL
1596
1597 PROTOTYPES: DISABLE
1598
1599 MODULE = IO::AIO PACKAGE = IO::AIO::REQ
1600
1601 void
1602 cancel (aio_req_ornot req)
1603 CODE:
1604 req_cancel (req);
1605
1606 void
1607 cb (aio_req_ornot req, SV *callback=&PL_sv_undef)
1608 CODE:
1609 SvREFCNT_dec (req->callback);
1610 req->callback = newSVsv (callback);
1611
1612 MODULE = IO::AIO PACKAGE = IO::AIO::GRP
1613
1614 void
1615 add (aio_req grp, ...)
1616 PPCODE:
1617 {
1618 int i;
1619 aio_req req;
1620
1621 if (grp->fd == 2)
1622 croak ("cannot add requests to IO::AIO::GRP after the group finished");
1623
1624 for (i = 1; i < items; ++i )
1625 {
1626 if (GIMME_V != G_VOID)
1627 XPUSHs (sv_2mortal (newSVsv (ST (i))));
1628
1629 req = SvAIO_REQ (ST (i));
1630
1631 if (req)
1632 {
1633 ++grp->length;
1634 req->grp = grp;
1635
1636 req->grp_prev = 0;
1637 req->grp_next = grp->grp_first;
1638
1639 if (grp->grp_first)
1640 grp->grp_first->grp_prev = req;
1641
1642 grp->grp_first = req;
1643 }
1644 }
1645 }
1646
1647 void
1648 cancel_subs (aio_req_ornot req)
1649 CODE:
1650 req_cancel_subs (req);
1651
1652 void
1653 result (aio_req grp, ...)
1654 CODE:
1655 {
1656 int i;
1657 AV *av;
1658
1659 grp->errorno = errno;
1660
1661 av = newAV ();
1662
1663 for (i = 1; i < items; ++i )
1664 av_push (av, newSVsv (ST (i)));
1665
1666 SvREFCNT_dec (grp->data);
1667 grp->data = (SV *)av;
1668 }
1669
1670 void
1671 errno (aio_req grp, int errorno = errno)
1672 CODE:
1673 grp->errorno = errorno;
1674
1675 void
1676 limit (aio_req grp, int limit)
1677 CODE:
1678 grp->fd2 = limit;
1679 aio_grp_feed (grp);
1680
1681 void
1682 feed (aio_req grp, SV *callback=&PL_sv_undef)
1683 CODE:
1684 {
1685 SvREFCNT_dec (grp->fh2);
1686 grp->fh2 = newSVsv (callback);
1687
1688 if (grp->fd2 <= 0)
1689 grp->fd2 = 2;
1690
1691 aio_grp_feed (grp);
1692 }
1693