1 |
#define PERL_NO_GET_CONTEXT |
2 |
|
3 |
#include "EXTERN.h" |
4 |
#include "perl.h" |
5 |
#include "XSUB.h" |
6 |
|
7 |
#include <sys/types.h> |
8 |
#include <sys/stat.h> |
9 |
#include <unistd.h> |
10 |
#include <fcntl.h> |
11 |
#include <signal.h> |
12 |
#include <sched.h> |
13 |
#include <endian.h> |
14 |
|
15 |
/*
 * Filehandle argument types used by the XS section below.  They are
 * declared here as untyped pointers; the original author describes this as
 * a hack needed because perl 5.6.1 is too old.
 */
typedef void *InputStream, *OutputStream, *InOutStream;
18 |
|
19 |
/*
 * Size in bytes of the stack given to each worker thread, expressed as a
 * number of machine words.  ia64 gets a much larger stack, x86 and amd64
 * the smallest; everything else uses the middle value.
 */
#if __ia64
# define STACKSIZE (8192 * sizeof (long))
#elif __i386 || __amd64
# define STACKSIZE ( 256 * sizeof (long))
#else
# define STACKSIZE ( 512 * sizeof (long))
#endif
26 |
|
27 |
/* Request opcodes stored in aio_cb.type and dispatched on by aio_proc. */
enum {
  REQ_QUIT,       /* tells the worker that receives it to exit */
  REQ_OPEN,
  REQ_CLOSE,
  REQ_READ,
  REQ_WRITE,
  REQ_READAHEAD,
  REQ_STAT,
  REQ_LSTAT,
  REQ_FSTAT,
  REQ_UNLINK,
  REQ_FSYNC,
  REQ_FDATASYNC,
};
34 |
|
35 |
typedef struct { |
36 |
char stack[STACKSIZE]; |
37 |
} aio_thread; |
38 |
|
39 |
typedef struct aio_cb { |
40 |
struct aio_cb *next; |
41 |
|
42 |
int type; |
43 |
aio_thread *thread; |
44 |
|
45 |
int fd; |
46 |
off_t offset; |
47 |
size_t length; |
48 |
ssize_t result; |
49 |
mode_t mode; /* open */ |
50 |
int errorno; |
51 |
SV *data, *callback; |
52 |
void *dataptr; |
53 |
STRLEN dataoffset; |
54 |
|
55 |
Stat_t *statdata; |
56 |
} aio_cb; |
57 |
|
58 |
/* Requests are always handled through pointers. */
typedef aio_cb *aio_req;

/* Number of workers started and not yet reaped after a REQ_QUIT. */
static int started;
/* Number of requests queued via send_req whose results were not yet read. */
static int nreqs;
/* Main -> worker pipe carrying request pointers. */
static int reqpipe[2];
/* Worker -> main pipe carrying finished request pointers. */
static int respipe[2];

/* Head and tail of the list of requests not yet written to reqpipe. */
static aio_req qs, qe;

/* Worker entry point, defined further down. */
static int aio_proc(void *arg);
67 |
|
68 |
static void |
69 |
start_thread (void) |
70 |
{ |
71 |
aio_thread *thr; |
72 |
|
73 |
New (0, thr, 1, aio_thread); |
74 |
|
75 |
if (clone (aio_proc, |
76 |
&(thr->stack[STACKSIZE - 16]), |
77 |
CLONE_VM|CLONE_FS|CLONE_FILES, |
78 |
thr) >= 0) |
79 |
started++; |
80 |
else |
81 |
Safefree (thr); |
82 |
} |
83 |
|
84 |
static void |
85 |
send_reqs (void) |
86 |
{ |
87 |
/* this write is atomic */ |
88 |
while (qs && write (reqpipe[1], &qs, sizeof qs) == sizeof qs) |
89 |
{ |
90 |
qs = qs->next; |
91 |
if (!qs) qe = 0; |
92 |
} |
93 |
} |
94 |
|
95 |
static void |
96 |
send_req (aio_req req) |
97 |
{ |
98 |
nreqs++; |
99 |
req->next = 0; |
100 |
|
101 |
if (qe) |
102 |
{ |
103 |
qe->next = req; |
104 |
qe = req; |
105 |
} |
106 |
else |
107 |
qe = qs = req; |
108 |
|
109 |
send_reqs (); |
110 |
} |
111 |
|
112 |
static void |
113 |
end_thread (void) |
114 |
{ |
115 |
aio_req req; |
116 |
New (0, req, 1, aio_cb); |
117 |
req->type = REQ_QUIT; |
118 |
|
119 |
send_req (req); |
120 |
} |
121 |
|
122 |
static void |
123 |
read_write (pTHX_ |
124 |
int dowrite, int fd, off_t offset, size_t length, |
125 |
SV *data, STRLEN dataoffset, SV *callback) |
126 |
{ |
127 |
aio_req req; |
128 |
STRLEN svlen; |
129 |
char *svptr = SvPV (data, svlen); |
130 |
|
131 |
SvUPGRADE (data, SVt_PV); |
132 |
SvPOK_on (data); |
133 |
|
134 |
if (dataoffset < 0) |
135 |
dataoffset += svlen; |
136 |
|
137 |
if (dataoffset < 0 || dataoffset > svlen) |
138 |
croak ("data offset outside of string"); |
139 |
|
140 |
if (dowrite) |
141 |
{ |
142 |
/* write: check length and adjust. */ |
143 |
if (length < 0 || length + dataoffset > svlen) |
144 |
length = svlen - dataoffset; |
145 |
} |
146 |
else |
147 |
{ |
148 |
/* read: grow scalar as necessary */ |
149 |
svptr = SvGROW (data, length + dataoffset); |
150 |
} |
151 |
|
152 |
if (length < 0) |
153 |
croak ("length must not be negative"); |
154 |
|
155 |
Newz (0, req, 1, aio_cb); |
156 |
|
157 |
if (!req) |
158 |
croak ("out of memory during aio_req allocation"); |
159 |
|
160 |
req->type = dowrite ? REQ_WRITE : REQ_READ; |
161 |
req->fd = fd; |
162 |
req->offset = offset; |
163 |
req->length = length; |
164 |
req->data = SvREFCNT_inc (data); |
165 |
req->dataptr = (char *)svptr + dataoffset; |
166 |
req->callback = SvREFCNT_inc (callback); |
167 |
|
168 |
send_req (req); |
169 |
} |
170 |
|
171 |
static void |
172 |
poll_wait () |
173 |
{ |
174 |
fd_set rfd; |
175 |
FD_ZERO(&rfd); |
176 |
FD_SET(respipe[0], &rfd); |
177 |
|
178 |
select (respipe[0] + 1, &rfd, 0, 0, 0); |
179 |
} |
180 |
|
181 |
static int |
182 |
poll_cb (pTHX) |
183 |
{ |
184 |
dSP; |
185 |
int count = 0; |
186 |
aio_req req; |
187 |
|
188 |
while (read (respipe[0], (void *)&req, sizeof (req)) == sizeof (req)) |
189 |
{ |
190 |
nreqs--; |
191 |
|
192 |
if (req->type == REQ_QUIT) |
193 |
{ |
194 |
Safefree (req->thread); |
195 |
started--; |
196 |
} |
197 |
else |
198 |
{ |
199 |
int errorno = errno; |
200 |
errno = req->errorno; |
201 |
|
202 |
if (req->type == REQ_READ) |
203 |
SvCUR_set (req->data, req->dataoffset |
204 |
+ req->result > 0 ? req->result : 0); |
205 |
|
206 |
if (req->data) |
207 |
SvREFCNT_dec (req->data); |
208 |
|
209 |
if (req->type == REQ_STAT || req->type == REQ_LSTAT || req->type == REQ_FSTAT) |
210 |
{ |
211 |
PL_laststype = req->type == REQ_LSTAT ? OP_LSTAT : OP_STAT; |
212 |
PL_laststatval = req->result; |
213 |
PL_statcache = *(req->statdata); |
214 |
|
215 |
Safefree (req->statdata); |
216 |
} |
217 |
|
218 |
PUSHMARK (SP); |
219 |
XPUSHs (sv_2mortal (newSViv (req->result))); |
220 |
PUTBACK; |
221 |
call_sv (req->callback, G_VOID); |
222 |
SPAGAIN; |
223 |
|
224 |
if (req->callback) |
225 |
SvREFCNT_dec (req->callback); |
226 |
|
227 |
errno = errorno; |
228 |
count++; |
229 |
} |
230 |
|
231 |
Safefree (req); |
232 |
} |
233 |
|
234 |
if (qs) |
235 |
send_reqs (); |
236 |
|
237 |
return count; |
238 |
} |
239 |
|
240 |
/* Signal mask installed in every worker; filled in by the BOOT section. */
static sigset_t fullsigset;

/* From here on `errno` is an ordinary identifier: aio_proc declares a
   local variable of that name. */
#undef errno
#include <asm/unistd.h>
#include <linux/types.h>
#include <sys/prctl.h>

/*
 * Provide `struct kernelstat` / `struct kernelstat64`.  On most
 * architectures these are simply aliases for stat / stat64.  On the listed
 * ones <asm/stat.h> is included with stat and stat64 temporarily renamed,
 * so the structures it declares carry the kernelstat names instead.
 */
#if !(__alpha || __ia64 || __hppa || __v850__)
# define kernelstat   stat
# define kernelstat64 stat64
#else
# define stat   kernelstat
# define stat64 kernelstat64
# include <asm/stat.h>
# undef stat
# undef stat64
#endif
257 |
|
258 |
/*
 * Copy the stat fields field by field from the local `statdata` structure
 * into the request's Stat_t buffer.  Expects `req` and `statdata` to be in
 * scope at the point of use and is meant to be followed by a semicolon.
 */
#define COPY_STATDATA                                         \
  do {                                                        \
    req->statdata->st_dev     = statdata.st_dev;              \
    req->statdata->st_ino     = statdata.st_ino;              \
    req->statdata->st_mode    = statdata.st_mode;             \
    req->statdata->st_nlink   = statdata.st_nlink;            \
    req->statdata->st_uid     = statdata.st_uid;              \
    req->statdata->st_gid     = statdata.st_gid;              \
    req->statdata->st_rdev    = statdata.st_rdev;             \
    req->statdata->st_size    = statdata.st_size;             \
    req->statdata->st_atime   = statdata.st_atime;            \
    req->statdata->st_mtime   = statdata.st_mtime;            \
    req->statdata->st_ctime   = statdata.st_ctime;            \
    req->statdata->st_blksize = statdata.st_blksize;          \
    req->statdata->st_blocks  = statdata.st_blocks;           \
  } while (0)
272 |
|
273 |
static int |
274 |
aio_proc (void *thr_arg) |
275 |
{ |
276 |
aio_thread *thr = thr_arg; |
277 |
aio_req req; |
278 |
int errno; |
279 |
|
280 |
/* this is very much kernel-specific :(:(:( */ |
281 |
/* we rely on gcc's ability to create closures. */ |
282 |
_syscall3(__kernel_size_t, read , unsigned int, fd, char *, buf, __kernel_size_t, count) |
283 |
_syscall3(__kernel_size_t, write, unsigned int, fd, char *, buf, __kernel_size_t, count) |
284 |
|
285 |
_syscall3(long, open, char *, pathname, int, flags, int, mode) |
286 |
_syscall1(long, close, unsigned int, fd) |
287 |
_syscall1(long, unlink, char *, filename); |
288 |
_syscall1(long, fsync, unsigned int, fd); |
289 |
|
290 |
#ifndef __NR_fdatasync |
291 |
# define __NR_fdatasync __NR_fsync |
292 |
#endif |
293 |
_syscall1(long, fdatasync, unsigned int, fd); |
294 |
|
295 |
#if BYTE_ORDER == LITTLE_ENDIAN |
296 |
# define LOFF_ARG(off) (off & 0xffffffff), (off >> 32) |
297 |
#elif BYTE_ORDER == BIG_ENDIAN |
298 |
# define LOFF_ARG(off) (off >> 32), (off & 0xffffffff) |
299 |
#endif |
300 |
|
301 |
#ifndef __NR_pread64 |
302 |
# define __NR_pread64 __NR_pread |
303 |
# define __NR_pwrite64 __NR_write |
304 |
#endif |
305 |
_syscall5(__kernel_ssize_t, pread64 , unsigned int, fd, char *, buf, |
306 |
__kernel_size_t, count, unsigned int, offset_lh, unsigned int, offset_hl) |
307 |
_syscall5(__kernel_ssize_t, pwrite64, unsigned int, fd, char *, buf, |
308 |
__kernel_size_t, count, unsigned int, offset_lh, unsigned int, offset_hl) |
309 |
_syscall4(long, readahead, unsigned int, fd, unsigned int, offset_lh, unsigned int, offset_hl, __kernel_size_t, count); |
310 |
|
311 |
#if __NR_stat64 |
312 |
_syscall2(long, stat64 , const char *, filename, struct kernelstat64 *, buf) |
313 |
_syscall2(long, lstat64, const char *, filename, struct kernelstat64 *, buf) |
314 |
_syscall2(long, fstat64, int , fd , struct kernelstat64 *, buf) |
315 |
#elif __NR_stat |
316 |
_syscall2(long, stat , const char *, filename, struct kernelstat *, buf) |
317 |
_syscall2(long, lstat, const char *, filename, struct kernelstat *, buf) |
318 |
_syscall2(long, fstat, int , fd , struct kernelstat *, buf) |
319 |
#else |
320 |
# error "neither stat64 nor stat defined" |
321 |
#endif |
322 |
|
323 |
/* the following two calls might clobber errno */ |
324 |
sigprocmask (SIG_SETMASK, &fullsigset, 0); |
325 |
prctl (PR_SET_PDEATHSIG, SIGKILL); |
326 |
|
327 |
/* then loop */ |
328 |
while (read (reqpipe[0], (void *)&req, sizeof (req)) == sizeof (req)) |
329 |
{ |
330 |
req->thread = thr; |
331 |
errno = 0; /* strictly unnecessary */ |
332 |
|
333 |
switch (req->type) |
334 |
{ |
335 |
case REQ_READ: req->result = pread64 (req->fd, req->dataptr, req->length, LOFF_ARG (req->offset)); break; |
336 |
case REQ_WRITE: req->result = pwrite64 (req->fd, req->dataptr, req->length, LOFF_ARG (req->offset)); break; |
337 |
case REQ_READAHEAD: req->result = readahead (req->fd, LOFF_ARG (req->offset), req->length); break; |
338 |
|
339 |
#if __NR_stat64 |
340 |
struct kernelstat64 statdata; |
341 |
case REQ_STAT: req->result = stat64 (req->dataptr, &statdata); COPY_STATDATA; break; |
342 |
case REQ_LSTAT: req->result = lstat64 (req->dataptr, &statdata); COPY_STATDATA; break; |
343 |
case REQ_FSTAT: req->result = fstat64 (req->fd , &statdata); COPY_STATDATA; break; |
344 |
#else |
345 |
struct kernelstat statdata; |
346 |
case REQ_STAT: req->result = stat (req->dataptr, &statdata); COPY_STATDATA; break; |
347 |
case REQ_LSTAT: req->result = lstat (req->dataptr, &statdata); COPY_STATDATA; break; |
348 |
case REQ_FSTAT: req->result = fstat (req->fd , &statdata); COPY_STATDATA; break; |
349 |
#endif |
350 |
|
351 |
case REQ_OPEN: req->result = open (req->dataptr, req->fd, req->mode); break; |
352 |
case REQ_CLOSE: req->result = close (req->fd); break; |
353 |
case REQ_UNLINK: req->result = unlink (req->dataptr); break; |
354 |
|
355 |
case REQ_FSYNC: req->result = fsync (req->fd); break; |
356 |
case REQ_FDATASYNC: req->result = fdatasync (req->fd); break; |
357 |
|
358 |
case REQ_QUIT: |
359 |
write (respipe[1], (void *)&req, sizeof (req)); |
360 |
return 0; |
361 |
|
362 |
default: |
363 |
req->result = ENOSYS; |
364 |
break; |
365 |
} |
366 |
|
367 |
req->errorno = errno; |
368 |
write (respipe[1], (void *)&req, sizeof (req)); |
369 |
} |
370 |
|
371 |
return 0; |
372 |
} |
373 |
|
374 |
MODULE = Linux::AIO PACKAGE = Linux::AIO |
375 |
|
376 |
BOOT:
{
	/* Workers block every signal except TERM, QUIT, ABRT and INT. */
	sigfillset (&fullsigset);
	sigdelset (&fullsigset, SIGTERM);
	sigdelset (&fullsigset, SIGQUIT);
	sigdelset (&fullsigset, SIGABRT);
	sigdelset (&fullsigset, SIGINT);

	if (pipe (reqpipe) || pipe (respipe))
	  croak ("unable to initialize request or result pipe");

	/* The main program never blocks on either pipe: it writes requests
	   and reads results in non-blocking mode. */
	if (fcntl (reqpipe[1], F_SETFL, O_NONBLOCK))
	  croak ("cannot set request pipe to nonblocking mode");

	if (fcntl (respipe[0], F_SETFL, O_NONBLOCK))
	  croak ("cannot set result pipe to nonblocking mode");
}
393 |
|
394 |
void |
395 |
min_parallel(nthreads) |
396 |
int nthreads |
397 |
PROTOTYPE: $ |
398 |
CODE: |
399 |
while (nthreads > started) |
400 |
start_thread (); |
401 |
|
402 |
void |
403 |
max_parallel(nthreads) |
404 |
int nthreads |
405 |
PROTOTYPE: $ |
406 |
CODE: |
407 |
{ |
408 |
int cur = started; |
409 |
while (cur > nthreads) |
410 |
{ |
411 |
end_thread (); |
412 |
cur--; |
413 |
} |
414 |
|
415 |
while (started > nthreads) |
416 |
{ |
417 |
poll_wait (); |
418 |
poll_cb (aTHX); |
419 |
} |
420 |
} |
421 |
|
422 |
void |
423 |
aio_open(pathname,flags,mode,callback) |
424 |
SV * pathname |
425 |
int flags |
426 |
int mode |
427 |
SV * callback |
428 |
PROTOTYPE: $$$$ |
429 |
CODE: |
430 |
{ |
431 |
aio_req req; |
432 |
|
433 |
Newz (0, req, 1, aio_cb); |
434 |
|
435 |
if (!req) |
436 |
croak ("out of memory during aio_req allocation"); |
437 |
|
438 |
req->type = REQ_OPEN; |
439 |
req->data = newSVsv (pathname); |
440 |
req->dataptr = SvPV_nolen (req->data); |
441 |
req->fd = flags; |
442 |
req->mode = mode; |
443 |
req->callback = SvREFCNT_inc (callback); |
444 |
|
445 |
send_req (req); |
446 |
} |
447 |
|
448 |
void |
449 |
aio_close(fh,callback) |
450 |
InputStream fh |
451 |
SV * callback |
452 |
PROTOTYPE: $$ |
453 |
ALIAS: |
454 |
aio_close = REQ_CLOSE |
455 |
aio_fsync = REQ_FSYNC |
456 |
aio_fdatasync = REQ_FDATASYNC |
457 |
CODE: |
458 |
{ |
459 |
aio_req req; |
460 |
|
461 |
Newz (0, req, 1, aio_cb); |
462 |
|
463 |
if (!req) |
464 |
croak ("out of memory during aio_req allocation"); |
465 |
|
466 |
req->type = ix; |
467 |
req->fd = PerlIO_fileno (fh); |
468 |
req->callback = SvREFCNT_inc (callback); |
469 |
|
470 |
send_req (req); |
471 |
} |
472 |
|
473 |
void |
474 |
aio_read(fh,offset,length,data,dataoffset,callback) |
475 |
InputStream fh |
476 |
UV offset |
477 |
IV length |
478 |
SV * data |
479 |
IV dataoffset |
480 |
SV * callback |
481 |
PROTOTYPE: $$$$$$ |
482 |
CODE: |
483 |
read_write (aTHX_ 0, PerlIO_fileno (fh), offset, length, data, dataoffset, callback); |
484 |
|
485 |
void |
486 |
aio_write(fh,offset,length,data,dataoffset,callback) |
487 |
OutputStream fh |
488 |
UV offset |
489 |
IV length |
490 |
SV * data |
491 |
IV dataoffset |
492 |
SV * callback |
493 |
PROTOTYPE: $$$$$$ |
494 |
CODE: |
495 |
read_write (aTHX_ 1, PerlIO_fileno (fh), offset, length, data, dataoffset, callback); |
496 |
|
497 |
void |
498 |
aio_readahead(fh,offset,length,callback) |
499 |
InputStream fh |
500 |
UV offset |
501 |
IV length |
502 |
SV * callback |
503 |
PROTOTYPE: $$$$ |
504 |
CODE: |
505 |
{ |
506 |
aio_req req; |
507 |
|
508 |
if (length < 0) |
509 |
croak ("length must not be negative"); |
510 |
|
511 |
Newz (0, req, 1, aio_cb); |
512 |
|
513 |
if (!req) |
514 |
croak ("out of memory during aio_req allocation"); |
515 |
|
516 |
req->type = REQ_READAHEAD; |
517 |
req->fd = PerlIO_fileno (fh); |
518 |
req->offset = offset; |
519 |
req->length = length; |
520 |
req->callback = SvREFCNT_inc (callback); |
521 |
|
522 |
send_req (req); |
523 |
} |
524 |
|
525 |
void |
526 |
aio_stat(fh_or_path,callback) |
527 |
SV * fh_or_path |
528 |
SV * callback |
529 |
PROTOTYPE: $$ |
530 |
ALIAS: |
531 |
aio_lstat = 1 |
532 |
CODE: |
533 |
{ |
534 |
aio_req req; |
535 |
|
536 |
Newz (0, req, 1, aio_cb); |
537 |
|
538 |
if (!req) |
539 |
croak ("out of memory during aio_req allocation"); |
540 |
|
541 |
New (0, req->statdata, 1, Stat_t); |
542 |
|
543 |
if (!req->statdata) |
544 |
croak ("out of memory during aio_req->statdata allocation"); |
545 |
|
546 |
if (SvPOK (fh_or_path)) |
547 |
{ |
548 |
req->type = ix ? REQ_LSTAT : REQ_STAT; |
549 |
req->data = newSVsv (fh_or_path); |
550 |
req->dataptr = SvPV_nolen (req->data); |
551 |
} |
552 |
else |
553 |
{ |
554 |
req->type = REQ_FSTAT; |
555 |
req->fd = PerlIO_fileno (IoIFP (sv_2io (fh_or_path))); |
556 |
} |
557 |
|
558 |
req->callback = SvREFCNT_inc (callback); |
559 |
|
560 |
send_req (req); |
561 |
} |
562 |
|
563 |
void |
564 |
aio_unlink(pathname,callback) |
565 |
SV * pathname |
566 |
SV * callback |
567 |
PROTOTYPE: $$ |
568 |
CODE: |
569 |
{ |
570 |
aio_req req; |
571 |
|
572 |
Newz (0, req, 1, aio_cb); |
573 |
|
574 |
if (!req) |
575 |
croak ("out of memory during aio_req allocation"); |
576 |
|
577 |
req->type = REQ_UNLINK; |
578 |
req->data = newSVsv (pathname); |
579 |
req->dataptr = SvPV_nolen (req->data); |
580 |
req->callback = SvREFCNT_inc (callback); |
581 |
|
582 |
send_req (req); |
583 |
} |
584 |
|
585 |
int |
586 |
poll_fileno() |
587 |
PROTOTYPE: |
588 |
CODE: |
589 |
RETVAL = respipe[0]; |
590 |
OUTPUT: |
591 |
RETVAL |
592 |
|
593 |
int |
594 |
poll_cb(...) |
595 |
PROTOTYPE: |
596 |
CODE: |
597 |
RETVAL = poll_cb (aTHX); |
598 |
OUTPUT: |
599 |
RETVAL |
600 |
|
601 |
void |
602 |
poll_wait() |
603 |
PROTOTYPE: |
604 |
CODE: |
605 |
poll_wait (); |
606 |
|
607 |
int |
608 |
nreqs() |
609 |
PROTOTYPE: |
610 |
CODE: |
611 |
RETVAL = nreqs; |
612 |
OUTPUT: |
613 |
RETVAL |
614 |
|