#define PERL_NO_GET_CONTEXT #include "EXTERN.h" #include "perl.h" #include "XSUB.h" #include #include #include #include #include #include #include typedef void *InputStream; /* hack, but 5.6.1 is simply toooo old ;) */ typedef void *OutputStream; /* hack, but 5.6.1 is simply toooo old ;) */ typedef void *InOutStream; /* hack, but 5.6.1 is simply toooo old ;) */ #if __i386 || __amd64 # define STACKSIZE ( 256 * sizeof (long)) #elif __ia64 # define STACKSIZE (8192 * sizeof (long)) #else # define STACKSIZE ( 512 * sizeof (long)) #endif enum { REQ_QUIT, REQ_OPEN, REQ_CLOSE, REQ_READ, REQ_WRITE, REQ_STAT, REQ_LSTAT, REQ_FSTAT, REQ_UNLINK }; typedef struct { char stack[STACKSIZE]; } aio_thread; typedef struct aio_cb { struct aio_cb *next; int type; aio_thread *thread; int fd; off_t offset; size_t length; ssize_t result; mode_t mode; /* open */ int errorno; SV *data, *callback; void *dataptr; STRLEN dataoffset; Stat_t *statdata; } aio_cb; typedef aio_cb *aio_req; static int started; static int nreqs; static int reqpipe[2], respipe[2]; static aio_req qs, qe; /* queue start, queue end */ static int aio_proc(void *arg); static void start_thread (void) { aio_thread *thr; New (0, thr, 1, aio_thread); if (clone (aio_proc, &(thr->stack[STACKSIZE - 16]), CLONE_VM|CLONE_FS|CLONE_FILES, thr) >= 0) started++; else Safefree (thr); } static void send_reqs (void) { /* this write is atomic */ while (qs && write (reqpipe[1], &qs, sizeof qs) == sizeof qs) { qs = qs->next; if (!qs) qe = 0; } } static void send_req (aio_req req) { nreqs++; req->next = 0; if (qe) { qe->next = req; qe = req; } else qe = qs = req; send_reqs (); } static void end_thread (void) { aio_req req; New (0, req, 1, aio_cb); req->type = REQ_QUIT; send_req (req); } static void read_write (pTHX_ int dowrite, int fd, off_t offset, size_t length, SV *data, STRLEN dataoffset, SV *callback) { aio_req req; STRLEN svlen; char *svptr = SvPV (data, svlen); SvUPGRADE (data, SVt_PV); SvPOK_on (data); if (dataoffset < 0) dataoffset += svlen; if (dataoffset < 0 || dataoffset > svlen) croak ("data offset outside of string"); if (dowrite) { /* write: check length and adjust. */ if (length < 0 || length + dataoffset > svlen) length = svlen - dataoffset; } else { /* read: grow scalar as necessary */ svptr = SvGROW (data, length + dataoffset); } if (length < 0) croak ("length must not be negative"); Newz (0, req, 1, aio_cb); if (!req) croak ("out of memory during aio_req allocation"); req->type = dowrite ? REQ_WRITE : REQ_READ; req->fd = fd; req->offset = offset; req->length = length; req->data = SvREFCNT_inc (data); req->dataptr = (char *)svptr + dataoffset; req->callback = SvREFCNT_inc (callback); send_req (req); } static void poll_wait () { fd_set rfd; FD_ZERO(&rfd); FD_SET(respipe[0], &rfd); select (respipe[0] + 1, &rfd, 0, 0, 0); } static int poll_cb (pTHX) { dSP; int count = 0; aio_req req; while (read (respipe[0], (void *)&req, sizeof (req)) == sizeof (req)) { nreqs--; if (req->type == REQ_QUIT) { Safefree (req->thread); started--; } else { int errorno = errno; errno = req->errorno; if (req->type == REQ_READ) SvCUR_set (req->data, req->dataoffset + req->result > 0 ? req->result : 0); if (req->data) SvREFCNT_dec (req->data); if (req->type == REQ_STAT || req->type == REQ_LSTAT || req->type == REQ_FSTAT) { PL_laststype = req->type == REQ_LSTAT ? OP_LSTAT : OP_STAT; PL_laststatval = req->result; PL_statcache = *(req->statdata); Safefree (req->statdata); } PUSHMARK (SP); XPUSHs (sv_2mortal (newSViv (req->result))); PUTBACK; call_sv (req->callback, G_VOID); SPAGAIN; if (req->callback) SvREFCNT_dec (req->callback); errno = errorno; count++; } Safefree (req); } if (qs) send_reqs (); return count; } static sigset_t fullsigset; #undef errno #include #include #if BYTE_ORDER == LITTLE_ENDIAN # define LONG_LONG_PAIR(HI, LO) LO, HI #elif BYTE_ORDER == BIG_ENDIAN # define LONG_LONG_PAIR(HI, LO) HI, LO #endif #if __alpha || __ia64 || __hppa || __v850__ # define stat kernelstat # define stat64 kernelstat64 # include # undef stat # undef stat64 #else # define kernelstat stat # define kernelstat64 stat64 #endif #define COPY_STATDATA \ req->statdata->st_dev = statdata.st_dev; \ req->statdata->st_ino = statdata.st_ino; \ req->statdata->st_mode = statdata.st_mode; \ req->statdata->st_nlink = statdata.st_nlink; \ req->statdata->st_uid = statdata.st_uid; \ req->statdata->st_gid = statdata.st_gid; \ req->statdata->st_rdev = statdata.st_rdev; \ req->statdata->st_size = statdata.st_size; \ req->statdata->st_atime = statdata.st_atime; \ req->statdata->st_mtime = statdata.st_mtime; \ req->statdata->st_ctime = statdata.st_ctime; \ req->statdata->st_blksize = statdata.st_blksize; \ req->statdata->st_blocks = statdata.st_blocks; \ static int aio_proc (void *thr_arg) { aio_thread *thr = thr_arg; aio_req req; int errno; /* this is very much kernel-specific :(:(:( */ /* we rely on gcc's ability to create closures. */ _syscall3(int,read,int,fd,char *,buf,size_t,count) _syscall3(int,write,int,fd,char *,buf,size_t,count) _syscall3(int,open,char *,pathname,int,flags,mode_t,mode) _syscall1(int,close,int,fd) #if __NR_pread64 _syscall5(int,pread64,int,fd,char *,buf,size_t,count,unsigned int,offset_lh,unsigned int,offset_hl) _syscall5(int,pwrite64,int,fd,char *,buf,size_t,count,unsigned int,offset_lh,unsigned int,offset_hl) #elif __NR_pread _syscall4(int,pread,int,fd,char *,buf,size_t,count,offset_t,offset) _syscall4(int,pwrite,int,fd,char *,buf,size_t,count,offset_t,offset) #else # error "neither pread nor pread64 defined" #endif #if __NR_stat64 _syscall2(int,stat64, const char *, filename, struct kernelstat64 *, buf) _syscall2(int,lstat64, const char *, filename, struct kernelstat64 *, buf) _syscall2(int,fstat64, int, fd, struct kernelstat64 *, buf) #elif __NR_stat _syscall2(int,stat, const char *, filename, struct kernelstat *, buf) _syscall2(int,lstat, const char *, filename, struct kernelstat *, buf) _syscall2(int,fstat, int, fd, struct kernelstat *, buf) #else # error "neither stat64 nor stat defined" #endif _syscall1(int,unlink, char *, filename); sigprocmask (SIG_SETMASK, &fullsigset, 0); prctl (PR_SET_PDEATHSIG, SIGKILL); /* then loop */ while (read (reqpipe[0], (void *)&req, sizeof (req)) == sizeof (req)) { req->thread = thr; errno = 0; /* strictly unnecessary */ switch (req->type) { #if __NR_pread64 case REQ_READ: req->result = pread64 (req->fd, req->dataptr, req->length, LONG_LONG_PAIR (req->offset >> 32, req->offset & 0xffffffff)); break; case REQ_WRITE: req->result = pwrite64(req->fd, req->dataptr, req->length, LONG_LONG_PAIR (req->offset >> 32, req->offset & 0xffffffff)); break; #else case REQ_READ: req->result = pread (req->fd, req->dataptr, req->length, req->offset); break; case REQ_WRITE: req->result = pwrite (req->fd, req->dataptr, req->length, req->offset); break; #endif #if __NR_stat64 struct kernelstat64 statdata; case REQ_STAT: req->result = stat64 (req->dataptr, &statdata); COPY_STATDATA; break; case REQ_LSTAT: req->result = lstat64 (req->dataptr, &statdata); COPY_STATDATA; break; case REQ_FSTAT: req->result = fstat64 (req->fd, &statdata); COPY_STATDATA; break; #else struct kernelstat statdata; case REQ_STAT: req->result = stat (req->dataptr, &statdata); COPY_STATDATA; break; case REQ_LSTAT: req->result = lstat (req->dataptr, &statdata); COPY_STATDATA; break; case REQ_FSTAT: req->result = fstat (req->fd, &statdata); COPY_STATDATA; break; #endif case REQ_OPEN: req->result = open (req->dataptr, req->fd, req->mode); break; case REQ_CLOSE: req->result = close (req->fd); break; case REQ_UNLINK: req->result = unlink (req->dataptr); break; case REQ_QUIT: default: write (respipe[1], (void *)&req, sizeof (req)); return 0; } req->errorno = errno; write (respipe[1], (void *)&req, sizeof (req)); } return 0; } MODULE = Linux::AIO PACKAGE = Linux::AIO BOOT: { sigfillset (&fullsigset); sigdelset (&fullsigset, SIGTERM); sigdelset (&fullsigset, SIGQUIT); sigdelset (&fullsigset, SIGABRT); sigdelset (&fullsigset, SIGINT); if (pipe (reqpipe) || pipe (respipe)) croak ("unable to initialize request or result pipe"); if (fcntl (reqpipe[1], F_SETFL, O_NONBLOCK)) croak ("cannot set result pipe to nonblocking mode"); if (fcntl (respipe[0], F_SETFL, O_NONBLOCK)) croak ("cannot set result pipe to nonblocking mode"); } void min_parallel(nthreads) int nthreads PROTOTYPE: $ CODE: while (nthreads > started) start_thread (); void max_parallel(nthreads) int nthreads PROTOTYPE: $ CODE: int cur = started; while (cur > nthreads) { end_thread (); cur--; } while (started > nthreads) { poll_wait (); poll_cb (aTHX); } void aio_open(pathname,flags,mode,callback) SV * pathname int flags int mode SV * callback PROTOTYPE: $$$$ CODE: aio_req req; Newz (0, req, 1, aio_cb); if (!req) croak ("out of memory during aio_req allocation"); req->type = REQ_OPEN; req->data = newSVsv (pathname); req->dataptr = SvPV_nolen (req->data); req->fd = flags; req->mode = mode; req->callback = SvREFCNT_inc (callback); send_req (req); void aio_close(fh,callback) InputStream fh SV * callback PROTOTYPE: $$ CODE: aio_req req; Newz (0, req, 1, aio_cb); if (!req) croak ("out of memory during aio_req allocation"); req->type = REQ_CLOSE; req->fd = PerlIO_fileno (fh); req->callback = SvREFCNT_inc (callback); send_req (req); void aio_read(fh,offset,length,data,dataoffset,callback) InputStream fh UV offset IV length SV * data IV dataoffset SV * callback PROTOTYPE: $$$$$$ CODE: read_write (aTHX_ 0, PerlIO_fileno (fh), offset, length, data, dataoffset, callback); void aio_write(fh,offset,length,data,dataoffset,callback) OutputStream fh UV offset IV length SV * data IV dataoffset SV * callback PROTOTYPE: $$$$$$ CODE: read_write (aTHX_ 1, PerlIO_fileno (fh), offset, length, data, dataoffset, callback); void aio_stat(fh_or_path,callback) SV * fh_or_path SV * callback PROTOTYPE: $$ ALIAS: aio_lstat = 1 CODE: aio_req req; Newz (0, req, 1, aio_cb); if (!req) croak ("out of memory during aio_req allocation"); New (0, req->statdata, 1, Stat_t); if (!req->statdata) croak ("out of memory during aio_req->statdata allocation"); if (SvPOK (fh_or_path)) { req->type = ix ? REQ_LSTAT : REQ_STAT; req->data = newSVsv (fh_or_path); req->dataptr = SvPV_nolen (req->data); } else { req->type = REQ_FSTAT; req->fd = PerlIO_fileno (IoIFP (sv_2io (fh_or_path))); } req->callback = SvREFCNT_inc (callback); send_req (req); void aio_unlink(pathname,callback) SV * pathname SV * callback PROTOTYPE: $$ CODE: aio_req req; Newz (0, req, 1, aio_cb); if (!req) croak ("out of memory during aio_req allocation"); req->type = REQ_UNLINK; req->data = newSVsv (pathname); req->dataptr = SvPV_nolen (req->data); req->callback = SvREFCNT_inc (callback); send_req (req); int poll_fileno() PROTOTYPE: CODE: RETVAL = respipe[0]; OUTPUT: RETVAL int poll_cb(...) PROTOTYPE: CODE: RETVAL = poll_cb (aTHX); OUTPUT: RETVAL void poll_wait() PROTOTYPE: CODE: poll_wait (); int nreqs() PROTOTYPE: CODE: RETVAL = nreqs; OUTPUT: RETVAL