ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/libeio/eio.c
(Generate patch)

Comparing libeio/eio.c (file contents):
Revision 1.99 by root, Tue Jul 26 11:07:08 2011 UTC vs.
Revision 1.126 by root, Fri Dec 28 07:33:41 2012 UTC

1/* 1/*
2 * libeio implementation 2 * libeio implementation
3 * 3 *
4 * Copyright (c) 2007,2008,2009,2010,2011 Marc Alexander Lehmann <libeio@schmorp.de> 4 * Copyright (c) 2007,2008,2009,2010,2011,2012 Marc Alexander Lehmann <libeio@schmorp.de>
5 * All rights reserved. 5 * All rights reserved.
6 * 6 *
7 * Redistribution and use in source and binary forms, with or without modifica- 7 * Redistribution and use in source and binary forms, with or without modifica-
8 * tion, are permitted provided that the following conditions are met: 8 * tion, are permitted provided that the following conditions are met:
9 * 9 *
10 * 1. Redistributions of source code must retain the above copyright notice, 10 * 1. Redistributions of source code must retain the above copyright notice,
11 * this list of conditions and the following disclaimer. 11 * this list of conditions and the following disclaimer.
12 * 12 *
13 * 2. Redistributions in binary form must reproduce the above copyright 13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the 14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution. 15 * documentation and/or other materials provided with the distribution.
16 * 16 *
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED 17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
18 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MER- 18 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MER-
19 * CHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO 19 * CHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
20 * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPE- 20 * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPE-
21 * CIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 21 * CIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
43 43
44#include "eio.h" 44#include "eio.h"
45#include "ecb.h" 45#include "ecb.h"
46 46
47#ifdef EIO_STACKSIZE 47#ifdef EIO_STACKSIZE
48# define XTHREAD_STACKSIZE EIO_STACKSIZE 48# define X_STACKSIZE EIO_STACKSIZE
49#endif 49#endif
50#include "xthread.h" 50#include "xthread.h"
51 51
52#include <errno.h> 52#include <errno.h>
53#include <stddef.h> 53#include <stddef.h>
105#ifdef _WIN32 105#ifdef _WIN32
106 106
107 #undef PAGESIZE 107 #undef PAGESIZE
108 #define PAGESIZE 4096 /* GetSystemInfo? */ 108 #define PAGESIZE 4096 /* GetSystemInfo? */
109 109
110 /* TODO: look at how perl does stat (non-sloppy), unlink (ro-files), utime, link */
111
110 #ifdef EIO_STRUCT_STATI64 112 #ifdef EIO_STRUCT_STATI64
113 /* look at perl's non-sloppy stat */
111 #define stat(path,buf) _stati64 (path,buf) 114 #define stat(path,buf) _stati64 (path,buf)
112 #define fstat(fd,buf) _fstati64 (fd,buf) 115 #define fstat(fd,buf) _fstati64 (fd,buf)
113 #endif 116 #endif
114 #define lstat(path,buf) stat (path,buf) 117 #define lstat(path,buf) stat (path,buf)
115 #define fsync(fd) (FlushFileBuffers ((HANDLE)EIO_FD_TO_WIN32_HANDLE (fd)) ? 0 : EIO_ERRNO (EBADF, -1)) 118 #define fsync(fd) (FlushFileBuffers ((HANDLE)EIO_FD_TO_WIN32_HANDLE (fd)) ? 0 : EIO_ERRNO (EBADF, -1))
128 #define mknod(path,mode,dev) EIO_ENOSYS () 131 #define mknod(path,mode,dev) EIO_ENOSYS ()
129 #define sync() EIO_ENOSYS () 132 #define sync() EIO_ENOSYS ()
130 #define readlink(path,buf,s) EIO_ENOSYS () 133 #define readlink(path,buf,s) EIO_ENOSYS ()
131 #define statvfs(path,buf) EIO_ENOSYS () 134 #define statvfs(path,buf) EIO_ENOSYS ()
132 #define fstatvfs(fd,buf) EIO_ENOSYS () 135 #define fstatvfs(fd,buf) EIO_ENOSYS ()
136
137 #define pread(fd,buf,count,offset) eio__pread (fd, buf, count, offset)
138 #define pwrite(fd,buf,count,offset) eio__pwrite (fd, buf, count, offset)
139
140 #if __GNUC__
141 typedef long long eio_off_t; /* signed for compatibility to msvc */
142 #else
143 typedef __int64 eio_off_t; /* unsigned not supported by msvc */
144 #endif
145
146 static eio_ssize_t
147 eio__pread (int fd, void *buf, eio_ssize_t count, eio_off_t offset)
148 {
149 OVERLAPPED o = { 0 };
150 DWORD got;
151
152 o.Offset = offset;
153 o.OffsetHigh = offset >> 32;
154
155 return ReadFile ((HANDLE)EIO_FD_TO_WIN32_HANDLE (fd), buf, count, &got, &o)
156 ? got : -1;
157 }
158
159 static eio_ssize_t
160 eio__pwrite (int fd, void *buf, eio_ssize_t count, eio_off_t offset)
161 {
162 OVERLAPPED o = { 0 };
163 DWORD got;
164
165 o.Offset = offset;
166 o.OffsetHigh = offset >> 32;
167
168 return WriteFile ((HANDLE)EIO_FD_TO_WIN32_HANDLE (fd), buf, count, &got, &o)
169 ? got : -1;
170 }
133 171
134 /* rename() uses MoveFile, which fails to overwrite */ 172 /* rename() uses MoveFile, which fails to overwrite */
135 #define rename(old,neu) eio__rename (old, neu) 173 #define rename(old,neu) eio__rename (old, neu)
136 174
137 static int 175 static int
205 #endif 243 #endif
206 244
207 #define D_NAME(entp) entp->d_name 245 #define D_NAME(entp) entp->d_name
208 246
209 /* POSIX_SOURCE is useless on bsd's, and XOPEN_SOURCE is unreliable there, too */ 247 /* POSIX_SOURCE is useless on bsd's, and XOPEN_SOURCE is unreliable there, too */
210 #if __FreeBSD__ || defined __NetBSD__ || defined __OpenBSD__ 248 #if __FreeBSD__ || __NetBSD__ || __OpenBSD__
211 #define _DIRENT_HAVE_D_TYPE /* sigh */ 249 #define _DIRENT_HAVE_D_TYPE /* sigh */
212 #define D_INO(de) (de)->d_fileno 250 #define D_INO(de) (de)->d_fileno
213 #define D_NAMLEN(de) (de)->d_namlen 251 #define D_NAMLEN(de) (de)->d_namlen
214 #elif __linux || defined d_ino || _XOPEN_SOURCE >= 600 252 #elif __linux || defined d_ino || _XOPEN_SOURCE >= 600
215 #define D_INO(de) (de)->d_ino 253 #define D_INO(de) (de)->d_ino
278#endif 316#endif
279 317
280/* buffer size for various temporary buffers */ 318/* buffer size for various temporary buffers */
281#define EIO_BUFSIZE 65536 319#define EIO_BUFSIZE 65536
282 320
283#define dBUF \ 321#define dBUF \
284 char *eio_buf = malloc (EIO_BUFSIZE); \ 322 char *eio_buf = malloc (EIO_BUFSIZE); \
285 errno = ENOMEM; \ 323 errno = ENOMEM; \
286 if (!eio_buf) \ 324 if (!eio_buf) \
287 return -1 325 return -1
288 326
289#define FUBd \ 327#define FUBd \
290 free (eio_buf) 328 free (eio_buf)
291 329
292#define EIO_TICKS ((1000000 + 1023) >> 10) 330#define EIO_TICKS ((1000000 + 1023) >> 10)
331
332/*****************************************************************************/
333
334struct tmpbuf
335{
336 void *ptr;
337 int len;
338};
339
340static void *
341tmpbuf_get (struct tmpbuf *buf, int len)
342{
343 if (buf->len < len)
344 {
345 free (buf->ptr);
346 buf->ptr = malloc (buf->len = len);
347 }
348
349 return buf->ptr;
350}
351
352struct tmpbuf;
353
354#if _POSIX_VERSION >= 200809L
355 #define HAVE_AT 1
356 #define WD2FD(wd) ((wd) ? (wd)->fd : AT_FDCWD)
357 #ifndef O_SEARCH
358 #define O_SEARCH O_RDONLY
359 #endif
360#else
361 #define HAVE_AT 0
362 static const char *wd_expand (struct tmpbuf *tmpbuf, eio_wd wd, const char *path);
363#endif
364
365struct eio_pwd
366{
367#if HAVE_AT
368 int fd;
369#endif
370 int len;
371 char str[1]; /* actually, a 0-terminated canonical path */
372};
373
374/*****************************************************************************/
293 375
294#define ETP_PRI_MIN EIO_PRI_MIN 376#define ETP_PRI_MIN EIO_PRI_MIN
295#define ETP_PRI_MAX EIO_PRI_MAX 377#define ETP_PRI_MAX EIO_PRI_MAX
296 378
297struct etp_worker; 379struct etp_worker;
321static void (*done_poll_cb) (void); 403static void (*done_poll_cb) (void);
322 404
323static unsigned int max_poll_time; /* reslock */ 405static unsigned int max_poll_time; /* reslock */
324static unsigned int max_poll_reqs; /* reslock */ 406static unsigned int max_poll_reqs; /* reslock */
325 407
326static volatile unsigned int nreqs; /* reqlock */ 408static unsigned int nreqs; /* reqlock */
327static volatile unsigned int nready; /* reqlock */ 409static unsigned int nready; /* reqlock */
328static volatile unsigned int npending; /* reqlock */ 410static unsigned int npending; /* reqlock */
329static volatile unsigned int max_idle = 4; /* maximum number of threads that can idle indefinitely */ 411static unsigned int max_idle = 4; /* maximum number of threads that can idle indefinitely */
330static volatile unsigned int idle_timeout = 10; /* number of seconds after which an idle threads exit */ 412static unsigned int idle_timeout = 10; /* number of seconds after which an idle threads exit */
331 413
332static xmutex_t wrklock; 414static xmutex_t wrklock;
333static xmutex_t reslock; 415static xmutex_t reslock;
334static xmutex_t reqlock; 416static xmutex_t reqlock;
335static xcond_t reqwait; 417static xcond_t reqwait;
336 418
337#if !HAVE_PREADWRITE
338/*
339 * make our pread/pwrite emulation safe against themselves, but not against
340 * normal read/write by using a mutex. slows down execution a lot,
341 * but that's your problem, not mine.
342 */
343static xmutex_t preadwritelock;
344#endif
345
346typedef struct etp_worker 419typedef struct etp_worker
347{ 420{
421 struct tmpbuf tmpbuf;
422
348 /* locked by wrklock */ 423 /* locked by wrklock */
349 struct etp_worker *prev, *next; 424 struct etp_worker *prev, *next;
350 425
351 xthread_t tid; 426 xthread_t tid;
352 427
353 /* locked by reslock, reqlock or wrklock */
354 ETP_REQ *req; /* currently processed request */
355
356#ifdef ETP_WORKER_COMMON 428#ifdef ETP_WORKER_COMMON
357 ETP_WORKER_COMMON 429 ETP_WORKER_COMMON
358#endif 430#endif
359} etp_worker; 431} etp_worker;
360 432
363#define ETP_WORKER_LOCK(wrk) X_LOCK (wrklock) 435#define ETP_WORKER_LOCK(wrk) X_LOCK (wrklock)
364#define ETP_WORKER_UNLOCK(wrk) X_UNLOCK (wrklock) 436#define ETP_WORKER_UNLOCK(wrk) X_UNLOCK (wrklock)
365 437
366/* worker threads management */ 438/* worker threads management */
367 439
368static void ecb_cold 440static void
369etp_worker_clear (etp_worker *wrk) 441etp_worker_clear (etp_worker *wrk)
370{ 442{
371} 443}
372 444
373static void ecb_cold 445static void ecb_cold
374etp_worker_free (etp_worker *wrk) 446etp_worker_free (etp_worker *wrk)
375{ 447{
448 free (wrk->tmpbuf.ptr);
449
376 wrk->next->prev = wrk->prev; 450 wrk->next->prev = wrk->prev;
377 wrk->prev->next = wrk->next; 451 wrk->prev->next = wrk->next;
378 452
379 free (wrk); 453 free (wrk);
380} 454}
528 /*TODO*/ 602 /*TODO*/
529 assert (("unable to allocate worker thread data", wrk)); 603 assert (("unable to allocate worker thread data", wrk));
530 604
531 X_LOCK (wrklock); 605 X_LOCK (wrklock);
532 606
533 if (thread_create (&wrk->tid, etp_proc, (void *)wrk)) 607 if (xthread_create (&wrk->tid, etp_proc, (void *)wrk))
534 { 608 {
535 wrk->prev = &wrk_first; 609 wrk->prev = &wrk_first;
536 wrk->next = wrk_first.next; 610 wrk->next = wrk_first.next;
537 wrk_first.next->prev = wrk; 611 wrk_first.next->prev = wrk;
538 wrk_first.next = wrk; 612 wrk_first.next = wrk;
558} 632}
559 633
560static void ecb_cold 634static void ecb_cold
561etp_end_thread (void) 635etp_end_thread (void)
562{ 636{
563 eio_req *req = calloc (1, sizeof (eio_req)); 637 eio_req *req = calloc (1, sizeof (eio_req)); /* will be freed by worker */
564 638
565 req->type = -1; 639 req->type = -1;
566 req->pri = ETP_PRI_MAX - ETP_PRI_MIN; 640 req->pri = ETP_PRI_MAX - ETP_PRI_MIN;
567 641
568 X_LOCK (reqlock); 642 X_LOCK (reqlock);
895} 969}
896 970
897/*****************************************************************************/ 971/*****************************************************************************/
898/* work around various missing functions */ 972/* work around various missing functions */
899 973
900#if !HAVE_PREADWRITE
901# undef pread
902# undef pwrite
903# define pread eio__pread
904# define pwrite eio__pwrite
905
906static eio_ssize_t
907eio__pread (int fd, void *buf, size_t count, off_t offset)
908{
909 eio_ssize_t res;
910 off_t ooffset;
911
912 X_LOCK (preadwritelock);
913 ooffset = lseek (fd, 0, SEEK_CUR);
914 lseek (fd, offset, SEEK_SET);
915 res = read (fd, buf, count);
916 lseek (fd, ooffset, SEEK_SET);
917 X_UNLOCK (preadwritelock);
918
919 return res;
920}
921
922static eio_ssize_t
923eio__pwrite (int fd, void *buf, size_t count, off_t offset)
924{
925 eio_ssize_t res;
926 off_t ooffset;
927
928 X_LOCK (preadwritelock);
929 ooffset = lseek (fd, 0, SEEK_CUR);
930 lseek (fd, offset, SEEK_SET);
931 res = write (fd, buf, count);
932 lseek (fd, ooffset, SEEK_SET);
933 X_UNLOCK (preadwritelock);
934
935 return res;
936}
937#endif
938
939#ifndef HAVE_UTIMES 974#ifndef HAVE_UTIMES
940 975
941# undef utimes 976# undef utimes
942# define utimes(path,times) eio__utimes (path, times) 977# define utimes(path,times) eio__utimes (path, times)
943 978
984 int res; 1019 int res;
985 1020
986#if HAVE_SYS_SYNCFS 1021#if HAVE_SYS_SYNCFS
987 res = (int)syscall (__NR_syncfs, (int)(fd)); 1022 res = (int)syscall (__NR_syncfs, (int)(fd));
988#else 1023#else
989 res = -1; 1024 res = EIO_ENOSYS ();
990 errno = ENOSYS;
991#endif 1025#endif
992 1026
993 if (res < 0 && errno == ENOSYS && fd >= 0) 1027 if (res < 0 && errno == ENOSYS && fd >= 0)
994 sync (); 1028 sync ();
995 1029
1025} 1059}
1026 1060
1027static int 1061static int
1028eio__fallocate (int fd, int mode, off_t offset, size_t len) 1062eio__fallocate (int fd, int mode, off_t offset, size_t len)
1029{ 1063{
1030#if HAVE_FALLOCATE 1064#if HAVE_LINUX_FALLOCATE
1031 return fallocate (fd, mode, offset, len); 1065 return fallocate (fd, mode, offset, len);
1032#else 1066#else
1033 errno = ENOSYS; 1067 return EIO_ENOSYS ();
1034 return -1;
1035#endif 1068#endif
1036} 1069}
1037 1070
1038#if !HAVE_READAHEAD 1071#if !HAVE_READAHEAD
1039# undef readahead 1072# undef readahead
1054 todo -= len; 1087 todo -= len;
1055 } 1088 }
1056 1089
1057 FUBd; 1090 FUBd;
1058 1091
1059 errno = 0; 1092 /* linux's readahead basically only fails for EBADF or EINVAL (not mmappable) */
1093 /* but not for e.g. EIO or eof, so we also never fail */
1060 return count; 1094 return 0;
1061} 1095}
1062 1096
1063#endif 1097#endif
1064 1098
1065/* sendfile always needs emulation */ 1099/* sendfile always needs emulation */
1100 1134
1101 /* according to source inspection, this is correct, and useful behaviour */ 1135 /* according to source inspection, this is correct, and useful behaviour */
1102 if (sbytes) 1136 if (sbytes)
1103 res = sbytes; 1137 res = sbytes;
1104 1138
1105# elif defined (__APPLE__) 1139# elif defined __APPLE__
1106 off_t sbytes = count; 1140 off_t sbytes = count;
1107 res = sendfile (ifd, ofd, offset, &sbytes, 0, 0); 1141 res = sendfile (ifd, ofd, offset, &sbytes, 0, 0);
1108 1142
1109 /* according to the manpage, sbytes is always valid */ 1143 /* according to the manpage, sbytes is always valid */
1110 if (sbytes) 1144 if (sbytes)
1137 HANDLE h = TO_SOCKET (ifd); 1171 HANDLE h = TO_SOCKET (ifd);
1138 SetFilePointer (h, offset, 0, FILE_BEGIN); 1172 SetFilePointer (h, offset, 0, FILE_BEGIN);
1139 res = TransmitFile (TO_SOCKET (ofd), h, count, 0, 0, 0, 0); 1173 res = TransmitFile (TO_SOCKET (ofd), h, count, 0, 0, 0, 0);
1140 1174
1141#else 1175#else
1142 res = -1; 1176 res = EIO_ENOSYS ();
1143 errno = ENOSYS;
1144#endif 1177#endif
1145 1178
1146 /* we assume sendfile can copy at least 128mb in one go */ 1179 /* we assume sendfile can copy at least 128mb in one go */
1147 if (res <= 128 * 1024 * 1024) 1180 if (res <= 128 * 1024 * 1024)
1148 { 1181 {
1335 1368
1336/*****************************************************************************/ 1369/*****************************************************************************/
1337/* requests implemented outside eio_execute, because they are so large */ 1370/* requests implemented outside eio_execute, because they are so large */
1338 1371
1339static void 1372static void
1340eio__realpath (eio_req *req, etp_worker *self) 1373eio__lseek (eio_req *req)
1341{ 1374{
1342 char *rel = req->ptr1; 1375 /* this usually gets optimised away completely, or your compiler sucks, */
1376 /* or the whence constants really are not 0, 1, 2 */
1377 int whence = req->int2 == EIO_SEEK_SET ? SEEK_SET
1378 : req->int2 == EIO_SEEK_CUR ? SEEK_CUR
1379 : req->int2 == EIO_SEEK_END ? SEEK_END
1380 : req->int2;
1381
1382 req->offs = lseek (req->int1, req->offs, whence);
1383 req->result = req->offs == (off_t)-1 ? -1 : 0;
1384}
1385
1386/* result will always end up in tmpbuf, there is always space for adding a 0-byte */
1387static int
1388eio__realpath (struct tmpbuf *tmpbuf, eio_wd wd, const char *path)
1389{
1390 const char *rel = path;
1343 char *res; 1391 char *res;
1344 char *tmp1, *tmp2; 1392 char *tmp1, *tmp2;
1345#if SYMLOOP_MAX > 32 1393#if SYMLOOP_MAX > 32
1346 int symlinks = SYMLOOP_MAX; 1394 int symlinks = SYMLOOP_MAX;
1347#else 1395#else
1348 int symlinks = 32; 1396 int symlinks = 32;
1349#endif 1397#endif
1350 1398
1351 req->result = -1;
1352
1353 errno = EINVAL; 1399 errno = EINVAL;
1354 if (!rel) 1400 if (!rel)
1355 return; 1401 return -1;
1356 1402
1357 errno = ENOENT; 1403 errno = ENOENT;
1358 if (!*rel) 1404 if (!*rel)
1359 return; 1405 return -1;
1360 1406
1361 if (!req->ptr2) 1407 res = tmpbuf_get (tmpbuf, PATH_MAX * 3);
1362 {
1363 X_LOCK (wrklock);
1364 req->flags |= EIO_FLAG_PTR2_FREE;
1365 X_UNLOCK (wrklock);
1366 req->ptr2 = malloc (PATH_MAX * 3);
1367
1368 errno = ENOMEM;
1369 if (!req->ptr2)
1370 return;
1371 }
1372
1373 res = req->ptr2;
1374 tmp1 = res + PATH_MAX; 1408 tmp1 = res + PATH_MAX;
1375 tmp2 = tmp1 + PATH_MAX; 1409 tmp2 = tmp1 + PATH_MAX;
1376 1410
1377#if 0 /* disabled, the musl way to do things is just too racy */ 1411#if 0 /* disabled, the musl way to do things is just too racy */
1378#if __linux && defined(O_NONBLOCK) && defined(O_NOATIME) 1412#if __linux && defined(O_NONBLOCK) && defined(O_NOATIME)
1382 1416
1383 if (fd >= 0) 1417 if (fd >= 0)
1384 { 1418 {
1385 sprintf (tmp1, "/proc/self/fd/%d", fd); 1419 sprintf (tmp1, "/proc/self/fd/%d", fd);
1386 req->result = readlink (tmp1, res, PATH_MAX); 1420 req->result = readlink (tmp1, res, PATH_MAX);
1421 /* here we should probably stat the open file and the disk file, to make sure they still match */
1387 close (fd); 1422 close (fd);
1388
1389 /* here we should probably stat the open file and the disk file, to make sure they still match */
1390 1423
1391 if (req->result > 0) 1424 if (req->result > 0)
1392 goto done; 1425 goto done;
1393 } 1426 }
1394 else if (errno == ELOOP || errno == ENAMETOOLONG || errno == ENOENT || errno == ENOTDIR || errno == EIO) 1427 else if (errno == ELOOP || errno == ENAMETOOLONG || errno == ENOENT || errno == ENOTDIR || errno == EIO)
1395 return; 1428 return -1;
1396 } 1429 }
1397#endif 1430#endif
1398#endif 1431#endif
1399 1432
1400 if (*rel != '/') 1433 if (*rel != '/')
1401 { 1434 {
1435 int len;
1436
1437 errno = ENOENT;
1438 if (wd == EIO_INVALID_WD)
1439 return -1;
1440
1441 if (wd == EIO_CWD)
1442 {
1402 if (!getcwd (res, PATH_MAX)) 1443 if (!getcwd (res, PATH_MAX))
1403 return; 1444 return -1;
1445
1446 len = strlen (res);
1447 }
1448 else
1449 memcpy (res, wd->str, len = wd->len);
1404 1450
1405 if (res [1]) /* only use if not / */ 1451 if (res [1]) /* only use if not / */
1406 res += strlen (res); 1452 res += len;
1407 } 1453 }
1408 1454
1409 while (*rel) 1455 while (*rel)
1410 { 1456 {
1411 eio_ssize_t len, linklen; 1457 eio_ssize_t len, linklen;
1412 char *beg = rel; 1458 const char *beg = rel;
1413 1459
1414 while (*rel && *rel != '/') 1460 while (*rel && *rel != '/')
1415 ++rel; 1461 ++rel;
1416 1462
1417 len = rel - beg; 1463 len = rel - beg;
1429 1475
1430 if (beg [1] == '.' && len == 2) 1476 if (beg [1] == '.' && len == 2)
1431 { 1477 {
1432 /* .. - back up one component, if possible */ 1478 /* .. - back up one component, if possible */
1433 1479
1434 while (res != req->ptr2) 1480 while (res != tmpbuf->ptr)
1435 if (*--res == '/') 1481 if (*--res == '/')
1436 break; 1482 break;
1437 1483
1438 continue; 1484 continue;
1439 } 1485 }
1440 } 1486 }
1441 1487
1442 errno = ENAMETOOLONG; 1488 errno = ENAMETOOLONG;
1443 if (res + 1 + len + 1 >= tmp1) 1489 if (res + 1 + len + 1 >= tmp1)
1444 return; 1490 return -1;
1445 1491
1446 /* copy one component */ 1492 /* copy one component */
1447 *res = '/'; 1493 *res = '/';
1448 memcpy (res + 1, beg, len); 1494 memcpy (res + 1, beg, len);
1449 1495
1450 /* zero-terminate, for readlink */ 1496 /* zero-terminate, for readlink */
1451 res [len + 1] = 0; 1497 res [len + 1] = 0;
1452 1498
1453 /* now check if it's a symlink */ 1499 /* now check if it's a symlink */
1454 linklen = readlink (req->ptr2, tmp1, PATH_MAX); 1500 linklen = readlink (tmpbuf->ptr, tmp1, PATH_MAX);
1455 1501
1456 if (linklen < 0) 1502 if (linklen < 0)
1457 { 1503 {
1458 if (errno != EINVAL) 1504 if (errno != EINVAL)
1459 return; 1505 return -1;
1460 1506
1461 /* it's a normal directory. hopefully */ 1507 /* it's a normal directory. hopefully */
1462 res += len + 1; 1508 res += len + 1;
1463 } 1509 }
1464 else 1510 else
1466 /* yay, it was a symlink - build new path in tmp2 */ 1512 /* yay, it was a symlink - build new path in tmp2 */
1467 int rellen = strlen (rel); 1513 int rellen = strlen (rel);
1468 1514
1469 errno = ENAMETOOLONG; 1515 errno = ENAMETOOLONG;
1470 if (linklen + 1 + rellen >= PATH_MAX) 1516 if (linklen + 1 + rellen >= PATH_MAX)
1471 return; 1517 return -1;
1472 1518
1473 errno = ELOOP; 1519 errno = ELOOP;
1474 if (!--symlinks) 1520 if (!--symlinks)
1475 return; 1521 return -1;
1476 1522
1477 if (*tmp1 == '/') 1523 if (*tmp1 == '/')
1478 res = req->ptr2; /* symlink resolves to an absolute path */ 1524 res = tmpbuf->ptr; /* symlink resolves to an absolute path */
1479 1525
1480 /* we need to be careful, as rel might point into tmp2 already */ 1526 /* we need to be careful, as rel might point into tmp2 already */
1481 memmove (tmp2 + linklen + 1, rel, rellen + 1); 1527 memmove (tmp2 + linklen + 1, rel, rellen + 1);
1482 tmp2 [linklen] = '/'; 1528 tmp2 [linklen] = '/';
1483 memcpy (tmp2, tmp1, linklen); 1529 memcpy (tmp2, tmp1, linklen);
1485 rel = tmp2; 1531 rel = tmp2;
1486 } 1532 }
1487 } 1533 }
1488 1534
1489 /* special case for the lone root path */ 1535 /* special case for the lone root path */
1490 if (res == req->ptr2) 1536 if (res == tmpbuf->ptr)
1491 *res++ = '/'; 1537 *res++ = '/';
1492 1538
1493 req->result = res - (char *)req->ptr2; 1539 return res - (char *)tmpbuf->ptr;
1494
1495done:
1496 req->ptr2 = realloc (req->ptr2, req->result); /* trade time for space savings */
1497} 1540}
1498 1541
1499static signed char 1542static signed char
1500eio_dent_cmp (const eio_dirent *a, const eio_dirent *b) 1543eio_dent_cmp (const eio_dirent *a, const eio_dirent *b)
1501{ 1544{
1689#ifdef _WIN32 1732#ifdef _WIN32
1690 { 1733 {
1691 int len = strlen ((const char *)req->ptr1); 1734 int len = strlen ((const char *)req->ptr1);
1692 char *path = malloc (MAX_PATH); 1735 char *path = malloc (MAX_PATH);
1693 const char *fmt; 1736 const char *fmt;
1737 const char *reqpath = wd_expand (&self->tmpbuf, req->wd, req->ptr1);
1694 1738
1695 if (!len) 1739 if (!len)
1696 fmt = "./*"; 1740 fmt = "./*";
1697 else if (((const char *)req->ptr1)[len - 1] == '/' || ((const char *)req->ptr1)[len - 1] == '\\') 1741 else if (reqpath[len - 1] == '/' || reqpath[len - 1] == '\\')
1698 fmt = "%s*"; 1742 fmt = "%s*";
1699 else 1743 else
1700 fmt = "%s/*"; 1744 fmt = "%s/*";
1701 1745
1702 _snprintf (path, MAX_PATH, fmt, (const char *)req->ptr1); 1746 _snprintf (path, MAX_PATH, fmt, reqpath);
1703 dirp = FindFirstFile (path, &entp); 1747 dirp = FindFirstFile (path, &entp);
1704 free (path); 1748 free (path);
1705 1749
1706 if (dirp == INVALID_HANDLE_VALUE) 1750 if (dirp == INVALID_HANDLE_VALUE)
1707 { 1751 {
1708 dirp = 0;
1709
1710 /* should steal _dosmaperr */ 1752 /* should steal _dosmaperr */
1711 switch (GetLastError ()) 1753 switch (GetLastError ())
1712 { 1754 {
1713 case ERROR_FILE_NOT_FOUND: 1755 case ERROR_FILE_NOT_FOUND:
1714 req->result = 0; 1756 req->result = 0;
1715 break; 1757 break;
1716 1758
1717 case ERROR_INVALID_NAME: 1759 case ERROR_INVALID_NAME:
1718 case ERROR_PATH_NOT_FOUND: 1760 case ERROR_PATH_NOT_FOUND:
1719 case ERROR_NO_MORE_FILES: 1761 case ERROR_NO_MORE_FILES:
1720 errno = ENOENT; 1762 errno = ENOENT;
1721 break; 1763 break;
1722 1764
1723 case ERROR_NOT_ENOUGH_MEMORY: 1765 case ERROR_NOT_ENOUGH_MEMORY:
1724 errno = ENOMEM; 1766 errno = ENOMEM;
1725 break; 1767 break;
1726 1768
1727 default: 1769 default:
1728 errno = EINVAL; 1770 errno = EINVAL;
1729 break; 1771 break;
1730 } 1772 }
1773
1774 return;
1731 } 1775 }
1732 } 1776 }
1733#else 1777#else
1778 #if HAVE_AT
1779 if (req->wd)
1780 {
1781 int fd = openat (WD2FD (req->wd), req->ptr1, O_CLOEXEC | O_SEARCH | O_DIRECTORY);
1782
1783 if (fd < 0)
1784 return;
1785
1786 dirp = fdopendir (fd);
1787
1788 if (!dirp)
1789 close (fd);
1790 }
1791 else
1734 dirp = opendir (req->ptr1); 1792 dirp = opendir (req->ptr1);
1793 #else
1794 dirp = opendir (wd_expand (&self->tmpbuf, req->wd, req->ptr1));
1795 #endif
1796
1797 if (!dirp)
1798 return;
1735#endif 1799#endif
1736 1800
1737 if (req->flags & EIO_FLAG_PTR1_FREE) 1801 if (req->flags & EIO_FLAG_PTR1_FREE)
1738 free (req->ptr1); 1802 free (req->ptr1);
1739 1803
1740 req->flags |= EIO_FLAG_PTR1_FREE | EIO_FLAG_PTR2_FREE; 1804 req->flags |= EIO_FLAG_PTR1_FREE | EIO_FLAG_PTR2_FREE;
1741 req->ptr1 = dents = flags ? malloc (dentalloc * sizeof (eio_dirent)) : 0; 1805 req->ptr1 = dents = flags ? malloc (dentalloc * sizeof (eio_dirent)) : 0;
1742 req->ptr2 = names = malloc (namesalloc); 1806 req->ptr2 = names = malloc (namesalloc);
1743 1807
1744 if (dirp && names && (!flags || dents)) 1808 if (!names || (flags && !dents))
1809 return;
1810
1745 for (;;) 1811 for (;;)
1746 { 1812 {
1747 int done; 1813 int done;
1748 1814
1749#ifdef _WIN32 1815#ifdef _WIN32
1750 done = !dirp; 1816 done = !dirp;
1751#else 1817#else
1752 errno = 0; 1818 errno = 0;
1753 entp = readdir (dirp); 1819 entp = readdir (dirp);
1754 done = !entp; 1820 done = !entp;
1755#endif 1821#endif
1756 1822
1757 if (done) 1823 if (done)
1758 { 1824 {
1759#ifndef _WIN32 1825#ifndef _WIN32
1760 int old_errno = errno; 1826 int old_errno = errno;
1761 closedir (dirp); 1827 closedir (dirp);
1762 errno = old_errno; 1828 errno = old_errno;
1763 1829
1764 if (errno) 1830 if (errno)
1765 break; 1831 break;
1766#endif 1832#endif
1767 1833
1768 /* sort etc. */ 1834 /* sort etc. */
1769 req->int1 = flags; 1835 req->int1 = flags;
1770 req->result = dentoffs; 1836 req->result = dentoffs;
1771 1837
1772 if (flags & EIO_READDIR_STAT_ORDER) 1838 if (flags & EIO_READDIR_STAT_ORDER)
1773 eio_dent_sort (dents, dentoffs, flags & EIO_READDIR_DIRS_FIRST ? 7 : 0, inode_bits); 1839 eio_dent_sort (dents, dentoffs, flags & EIO_READDIR_DIRS_FIRST ? 7 : 0, inode_bits);
1774 else if (flags & EIO_READDIR_DIRS_FIRST) 1840 else if (flags & EIO_READDIR_DIRS_FIRST)
1775 if (flags & EIO_READDIR_FOUND_UNKNOWN) 1841 if (flags & EIO_READDIR_FOUND_UNKNOWN)
1776 eio_dent_sort (dents, dentoffs, 7, inode_bits); /* sort by score and inode */ 1842 eio_dent_sort (dents, dentoffs, 7, inode_bits); /* sort by score and inode */
1777 else 1843 else
1844 {
1845 /* in this case, all is known, and we just put dirs first and sort them */
1846 eio_dirent *oth = dents + dentoffs;
1847 eio_dirent *dir = dents;
1848
1849 /* now partition dirs to the front, and non-dirs to the back */
1850 /* by walking from both sides and swapping if necessary */
1851 while (oth > dir)
1852 {
1853 if (dir->type == EIO_DT_DIR)
1854 ++dir;
1855 else if ((--oth)->type == EIO_DT_DIR)
1856 {
1857 eio_dirent tmp = *dir; *dir = *oth; *oth = tmp;
1858
1859 ++dir;
1860 }
1861 }
1862
1863 /* now sort the dirs only (dirs all have the same score) */
1864 eio_dent_sort (dents, dir - dents, 0, inode_bits);
1865 }
1866
1867 break;
1868 }
1869
1870 /* now add the entry to our list(s) */
1871 name = D_NAME (entp);
1872
1873 /* skip . and .. entries */
1874 if (name [0] != '.' || (name [1] && (name [1] != '.' || name [2])))
1875 {
1876 int len = D_NAMLEN (entp) + 1;
1877
1878 while (ecb_expect_false (namesoffs + len > namesalloc))
1879 {
1880 namesalloc *= 2;
1881 req->ptr2 = names = realloc (names, namesalloc);
1882
1883 if (!names)
1884 break;
1885 }
1886
1887 memcpy (names + namesoffs, name, len);
1888
1889 if (dents)
1890 {
1891 struct eio_dirent *ent;
1892
1893 if (ecb_expect_false (dentoffs == dentalloc))
1778 { 1894 {
1779 /* in this case, all is known, and we just put dirs first and sort them */ 1895 dentalloc *= 2;
1896 req->ptr1 = dents = realloc (dents, dentalloc * sizeof (eio_dirent));
1897
1898 if (!dents)
1899 break;
1900 }
1901
1780 eio_dirent *oth = dents + dentoffs; 1902 ent = dents + dentoffs;
1781 eio_dirent *dir = dents;
1782 1903
1783 /* now partition dirs to the front, and non-dirs to the back */ 1904 ent->nameofs = namesoffs; /* rather dirtily we store the offset in the pointer */
1784 /* by walking from both sides and swapping if necessary */ 1905 ent->namelen = len - 1;
1785 while (oth > dir) 1906 ent->inode = D_INO (entp);
1907
1908 inode_bits |= ent->inode;
1909
1910 switch (D_TYPE (entp))
1911 {
1912 default:
1913 ent->type = EIO_DT_UNKNOWN;
1914 flags |= EIO_READDIR_FOUND_UNKNOWN;
1915 break;
1916
1917 #ifdef DT_FIFO
1918 case DT_FIFO: ent->type = EIO_DT_FIFO; break;
1919 #endif
1920 #ifdef DT_CHR
1921 case DT_CHR: ent->type = EIO_DT_CHR; break;
1922 #endif
1923 #ifdef DT_MPC
1924 case DT_MPC: ent->type = EIO_DT_MPC; break;
1925 #endif
1926 #ifdef DT_DIR
1927 case DT_DIR: ent->type = EIO_DT_DIR; break;
1928 #endif
1929 #ifdef DT_NAM
1930 case DT_NAM: ent->type = EIO_DT_NAM; break;
1931 #endif
1932 #ifdef DT_BLK
1933 case DT_BLK: ent->type = EIO_DT_BLK; break;
1934 #endif
1935 #ifdef DT_MPB
1936 case DT_MPB: ent->type = EIO_DT_MPB; break;
1937 #endif
1938 #ifdef DT_REG
1939 case DT_REG: ent->type = EIO_DT_REG; break;
1940 #endif
1941 #ifdef DT_NWK
1942 case DT_NWK: ent->type = EIO_DT_NWK; break;
1943 #endif
1944 #ifdef DT_CMP
1945 case DT_CMP: ent->type = EIO_DT_CMP; break;
1946 #endif
1947 #ifdef DT_LNK
1948 case DT_LNK: ent->type = EIO_DT_LNK; break;
1949 #endif
1950 #ifdef DT_SOCK
1951 case DT_SOCK: ent->type = EIO_DT_SOCK; break;
1952 #endif
1953 #ifdef DT_DOOR
1954 case DT_DOOR: ent->type = EIO_DT_DOOR; break;
1955 #endif
1956 #ifdef DT_WHT
1957 case DT_WHT: ent->type = EIO_DT_WHT; break;
1958 #endif
1959 }
1960
1961 ent->score = 7;
1962
1963 if (flags & EIO_READDIR_DIRS_FIRST)
1964 {
1965 if (ent->type == EIO_DT_UNKNOWN)
1786 { 1966 {
1787 if (dir->type == EIO_DT_DIR) 1967 if (*name == '.') /* leading dots are likely directories, and, in any case, rare */
1788 ++dir; 1968 ent->score = 1;
1789 else if ((--oth)->type == EIO_DT_DIR) 1969 else if (!strchr (name, '.')) /* absence of dots indicate likely dirs */
1790 { 1970 ent->score = len <= 2 ? 4 - len : len <= 4 ? 4 : len <= 7 ? 5 : 6; /* shorter == more likely dir, but avoid too many classes */
1791 eio_dirent tmp = *dir; *dir = *oth; *oth = tmp;
1792
1793 ++dir;
1794 }
1795 } 1971 }
1796 1972 else if (ent->type == EIO_DT_DIR)
1797 /* now sort the dirs only (dirs all have the same score) */ 1973 ent->score = 0;
1798 eio_dent_sort (dents, dir - dents, 0, inode_bits);
1799 } 1974 }
1800
1801 break;
1802 }
1803
1804 /* now add the entry to our list(s) */
1805 name = D_NAME (entp);
1806
1807 /* skip . and .. entries */
1808 if (name [0] != '.' || (name [1] && (name [1] != '.' || name [2])))
1809 {
1810 int len = D_NAMLEN (entp) + 1;
1811
1812 while (ecb_expect_false (namesoffs + len > namesalloc))
1813 {
1814 namesalloc *= 2;
1815 req->ptr2 = names = realloc (names, namesalloc);
1816
1817 if (!names)
1818 break;
1819 } 1975 }
1820 1976
1821 memcpy (names + namesoffs, name, len);
1822
1823 if (dents)
1824 {
1825 struct eio_dirent *ent;
1826
1827 if (ecb_expect_false (dentoffs == dentalloc))
1828 {
1829 dentalloc *= 2;
1830 req->ptr1 = dents = realloc (dents, dentalloc * sizeof (eio_dirent));
1831
1832 if (!dents)
1833 break;
1834 }
1835
1836 ent = dents + dentoffs;
1837
1838 ent->nameofs = namesoffs; /* rather dirtily we store the offset in the pointer */
1839 ent->namelen = len - 1;
1840 ent->inode = D_INO (entp);
1841
1842 inode_bits |= ent->inode;
1843
1844 switch (D_TYPE (entp))
1845 {
1846 default:
1847 ent->type = EIO_DT_UNKNOWN;
1848 flags |= EIO_READDIR_FOUND_UNKNOWN;
1849 break;
1850
1851 #ifdef DT_FIFO
1852 case DT_FIFO: ent->type = EIO_DT_FIFO; break;
1853 #endif
1854 #ifdef DT_CHR
1855 case DT_CHR: ent->type = EIO_DT_CHR; break;
1856 #endif
1857 #ifdef DT_MPC
1858 case DT_MPC: ent->type = EIO_DT_MPC; break;
1859 #endif
1860 #ifdef DT_DIR
1861 case DT_DIR: ent->type = EIO_DT_DIR; break;
1862 #endif
1863 #ifdef DT_NAM
1864 case DT_NAM: ent->type = EIO_DT_NAM; break;
1865 #endif
1866 #ifdef DT_BLK
1867 case DT_BLK: ent->type = EIO_DT_BLK; break;
1868 #endif
1869 #ifdef DT_MPB
1870 case DT_MPB: ent->type = EIO_DT_MPB; break;
1871 #endif
1872 #ifdef DT_REG
1873 case DT_REG: ent->type = EIO_DT_REG; break;
1874 #endif
1875 #ifdef DT_NWK
1876 case DT_NWK: ent->type = EIO_DT_NWK; break;
1877 #endif
1878 #ifdef DT_CMP
1879 case DT_CMP: ent->type = EIO_DT_CMP; break;
1880 #endif
1881 #ifdef DT_LNK
1882 case DT_LNK: ent->type = EIO_DT_LNK; break;
1883 #endif
1884 #ifdef DT_SOCK
1885 case DT_SOCK: ent->type = EIO_DT_SOCK; break;
1886 #endif
1887 #ifdef DT_DOOR
1888 case DT_DOOR: ent->type = EIO_DT_DOOR; break;
1889 #endif
1890 #ifdef DT_WHT
1891 case DT_WHT: ent->type = EIO_DT_WHT; break;
1892 #endif
1893 }
1894
1895 ent->score = 7;
1896
1897 if (flags & EIO_READDIR_DIRS_FIRST)
1898 {
1899 if (ent->type == EIO_DT_UNKNOWN)
1900 {
1901 if (*name == '.') /* leading dots are likely directories, and, in any case, rare */
1902 ent->score = 1;
1903 else if (!strchr (name, '.')) /* absense of dots indicate likely dirs */
1904 ent->score = len <= 2 ? 4 - len : len <= 4 ? 4 : len <= 7 ? 5 : 6; /* shorter == more likely dir, but avoid too many classes */
1905 }
1906 else if (ent->type == EIO_DT_DIR)
1907 ent->score = 0;
1908 }
1909 }
1910
1911 namesoffs += len; 1977 namesoffs += len;
1912 ++dentoffs; 1978 ++dentoffs;
1913 } 1979 }
1914 1980
1915 if (EIO_CANCELLED (req)) 1981 if (EIO_CANCELLED (req))
1916 { 1982 {
1917 errno = ECANCELED; 1983 errno = ECANCELED;
1918 break; 1984 break;
1919 } 1985 }
1920 1986
1921#ifdef _WIN32 1987#ifdef _WIN32
1922 if (!FindNextFile (dirp, &entp)) 1988 if (!FindNextFile (dirp, &entp))
1923 { 1989 {
1924 FindClose (dirp); 1990 FindClose (dirp);
1925 dirp = 0; 1991 dirp = 0;
1926 } 1992 }
1927#endif 1993#endif
1928 } 1994 }
1929} 1995}
1996
1997/*****************************************************************************/
1998/* working directory stuff */
1999/* various deficiencies in the posix 2008 api force us to */
2000/* keep the absolute path in string form at all times */
2001/* fuck yeah. */
2002
2003#if !HAVE_AT
2004
2005/* a bit like realpath, but usually faster because it doesn'T have to return */
2006/* an absolute or canonical path */
2007static const char *
2008wd_expand (struct tmpbuf *tmpbuf, eio_wd wd, const char *path)
2009{
2010 if (!wd || *path == '/')
2011 return path;
2012
2013 if (path [0] == '.' && !path [1])
2014 return wd->str;
2015
2016 {
2017 int l1 = wd->len;
2018 int l2 = strlen (path);
2019
2020 char *res = tmpbuf_get (tmpbuf, l1 + l2 + 2);
2021
2022 memcpy (res, wd->str, l1);
2023 res [l1] = '/';
2024 memcpy (res + l1 + 1, path, l2 + 1);
2025
2026 return res;
2027 }
2028}
2029
2030#endif
2031
2032static eio_wd
2033eio__wd_open_sync (struct tmpbuf *tmpbuf, eio_wd wd, const char *path)
2034{
2035 int fd;
2036 eio_wd res;
2037 int len = eio__realpath (tmpbuf, wd, path);
2038
2039 if (len < 0)
2040 return EIO_INVALID_WD;
2041
2042#if HAVE_AT
2043 fd = openat (WD2FD (wd), path, O_CLOEXEC | O_SEARCH | O_DIRECTORY);
2044
2045 if (fd < 0)
2046 return EIO_INVALID_WD;
2047#endif
2048
2049 res = malloc (sizeof (*res) + len); /* one extra 0-byte */
2050
2051#if HAVE_AT
2052 res->fd = fd;
2053#endif
2054
2055 res->len = len;
2056 memcpy (res->str, tmpbuf->ptr, len);
2057 res->str [len] = 0;
2058
2059 return res;
2060}
2061
2062eio_wd
2063eio_wd_open_sync (eio_wd wd, const char *path)
2064{
2065 struct tmpbuf tmpbuf = { 0 };
2066 wd = eio__wd_open_sync (&tmpbuf, wd, path);
2067 free (tmpbuf.ptr);
2068
2069 return wd;
2070}
2071
2072void
2073eio_wd_close_sync (eio_wd wd)
2074{
2075 if (wd != EIO_INVALID_WD && wd != EIO_CWD)
2076 {
2077 #if HAVE_AT
2078 close (wd->fd);
2079 #endif
2080 free (wd);
2081 }
2082}
2083
2084#if HAVE_AT
2085
2086/* they forgot these */
2087
2088static int
2089eio__truncateat (int dirfd, const char *path, off_t length)
2090{
2091 int fd = openat (dirfd, path, O_WRONLY | O_CLOEXEC);
2092 int res;
2093
2094 if (fd < 0)
2095 return fd;
2096
2097 res = ftruncate (fd, length);
2098 close (fd);
2099 return res;
2100}
2101
2102static int
2103eio__statvfsat (int dirfd, const char *path, struct statvfs *buf)
2104{
2105 int fd = openat (dirfd, path, O_SEARCH | O_CLOEXEC);
2106 int res;
2107
2108 if (fd < 0)
2109 return fd;
2110
2111 res = fstatvfs (fd, buf);
2112 close (fd);
2113 return res;
2114
2115}
2116
2117#endif
1930 2118
1931/*****************************************************************************/ 2119/*****************************************************************************/
1932 2120
1933#define ALLOC(len) \ 2121#define ALLOC(len) \
1934 if (!req->ptr2) \ 2122 if (!req->ptr2) \
1943 req->result = -1; \ 2131 req->result = -1; \
1944 break; \ 2132 break; \
1945 } \ 2133 } \
1946 } 2134 }
1947 2135
2136static void ecb_noinline ecb_cold
2137etp_proc_init (void)
2138{
2139#if HAVE_PRCTL_SET_NAME
2140 /* provide a more sensible "thread name" */
2141 char name[16 + 1];
2142 const int namelen = sizeof (name) - 1;
2143 int len;
2144
2145 prctl (PR_GET_NAME, (unsigned long)name, 0, 0, 0);
2146 name [namelen] = 0;
2147 len = strlen (name);
2148 strcpy (name + (len <= namelen - 4 ? len : namelen - 4), "/eio");
2149 prctl (PR_SET_NAME, (unsigned long)name, 0, 0, 0);
2150#endif
2151}
2152
1948X_THREAD_PROC (etp_proc) 2153X_THREAD_PROC (etp_proc)
1949{ 2154{
1950 ETP_REQ *req; 2155 ETP_REQ *req;
1951 struct timespec ts; 2156 struct timespec ts;
1952 etp_worker *self = (etp_worker *)thr_arg; 2157 etp_worker *self = (etp_worker *)thr_arg;
1953 2158
1954#if HAVE_PRCTL_SET_NAME 2159 etp_proc_init ();
1955 prctl (PR_SET_NAME, (unsigned long)"eio_thread", 0, 0, 0);
1956#endif
1957 2160
1958 /* try to distribute timeouts somewhat evenly */ 2161 /* try to distribute timeouts somewhat evenly */
1959 ts.tv_nsec = ((unsigned long)self & 1023UL) * (1000000000UL / 1024UL); 2162 ts.tv_nsec = ((unsigned long)self & 1023UL) * (1000000000UL / 1024UL);
1960 2163
1961 for (;;) 2164 for (;;)
1964 2167
1965 X_LOCK (reqlock); 2168 X_LOCK (reqlock);
1966 2169
1967 for (;;) 2170 for (;;)
1968 { 2171 {
1969 self->req = req = reqq_shift (&req_queue); 2172 req = reqq_shift (&req_queue);
1970 2173
1971 if (req) 2174 if (req)
1972 break; 2175 break;
1973 2176
1974 if (ts.tv_sec == 1) /* no request, but timeout detected, let's quit */ 2177 if (ts.tv_sec == 1) /* no request, but timeout detected, let's quit */
2012 ++npending; 2215 ++npending;
2013 2216
2014 if (!reqq_push (&res_queue, req) && want_poll_cb) 2217 if (!reqq_push (&res_queue, req) && want_poll_cb)
2015 want_poll_cb (); 2218 want_poll_cb ();
2016 2219
2017 self->req = 0;
2018 etp_worker_clear (self); 2220 etp_worker_clear (self);
2019 2221
2020 X_UNLOCK (reslock); 2222 X_UNLOCK (reslock);
2021 } 2223 }
2022 2224
2023quit: 2225quit:
2226 free (req);
2227
2024 X_LOCK (wrklock); 2228 X_LOCK (wrklock);
2025 etp_worker_free (self); 2229 etp_worker_free (self);
2026 X_UNLOCK (wrklock); 2230 X_UNLOCK (wrklock);
2027 2231
2028 return 0; 2232 return 0;
2031/*****************************************************************************/ 2235/*****************************************************************************/
2032 2236
2033int ecb_cold 2237int ecb_cold
2034eio_init (void (*want_poll)(void), void (*done_poll)(void)) 2238eio_init (void (*want_poll)(void), void (*done_poll)(void))
2035{ 2239{
2036#if !HAVE_PREADWRITE
2037 X_MUTEX_CREATE (preadwritelock);
2038#endif
2039
2040 return etp_init (want_poll, done_poll); 2240 return etp_init (want_poll, done_poll);
2041} 2241}
2042 2242
2043ecb_inline void 2243ecb_inline void
2044eio_api_destroy (eio_req *req) 2244eio_api_destroy (eio_req *req)
2045{ 2245{
2046 free (req); 2246 free (req);
2047} 2247}
2048 2248
2049#define REQ(rtype) \ 2249#define REQ(rtype) \
2050 eio_req *req; \ 2250 eio_req *req; \
2051 \ 2251 \
2052 req = (eio_req *)calloc (1, sizeof *req); \ 2252 req = (eio_req *)calloc (1, sizeof *req); \
2053 if (!req) \ 2253 if (!req) \
2054 return 0; \ 2254 return 0; \
2068 { \ 2268 { \
2069 eio_api_destroy (req); \ 2269 eio_api_destroy (req); \
2070 return 0; \ 2270 return 0; \
2071 } 2271 }
2072 2272
/* true iff the 0-terminated string at ptr is exactly "." */
#define SINGLEDOT(ptr) (((char *)(ptr))[0] == '.' && ((char *)(ptr))[1] == 0)
2274
2073static void 2275static void
2074eio_execute (etp_worker *self, eio_req *req) 2276eio_execute (etp_worker *self, eio_req *req)
2075{ 2277{
2278#if HAVE_AT
2279 int dirfd;
2280#else
2281 const char *path;
2282#endif
2283
2076 if (ecb_expect_false (EIO_CANCELLED (req))) 2284 if (ecb_expect_false (EIO_CANCELLED (req)))
2077 { 2285 {
2078 req->result = -1; 2286 req->result = -1;
2079 req->errorno = ECANCELED; 2287 req->errorno = ECANCELED;
2080 return; 2288 return;
2081 } 2289 }
2082 2290
2291 if (ecb_expect_false (req->wd == EIO_INVALID_WD))
2292 {
2293 req->result = -1;
2294 req->errorno = ENOENT;
2295 return;
2296 }
2297
2298 if (req->type >= EIO_OPEN)
2299 {
2300 #if HAVE_AT
2301 dirfd = WD2FD (req->wd);
2302 #else
2303 path = wd_expand (&self->tmpbuf, req->wd, req->ptr1);
2304 #endif
2305 }
2306
2083 switch (req->type) 2307 switch (req->type)
2084 { 2308 {
2309 case EIO_WD_OPEN: req->wd = eio__wd_open_sync (&self->tmpbuf, req->wd, req->ptr1);
2310 req->result = req->wd == EIO_INVALID_WD ? -1 : 0;
2311 break;
2312 case EIO_WD_CLOSE: req->result = 0;
2313 eio_wd_close_sync (req->wd); break;
2314
2315 case EIO_SEEK: eio__lseek (req); break;
2085 case EIO_READ: ALLOC (req->size); 2316 case EIO_READ: ALLOC (req->size);
2086 req->result = req->offs >= 0 2317 req->result = req->offs >= 0
2087 ? pread (req->int1, req->ptr2, req->size, req->offs) 2318 ? pread (req->int1, req->ptr2, req->size, req->offs)
2088 : read (req->int1, req->ptr2, req->size); break; 2319 : read (req->int1, req->ptr2, req->size); break;
2089 case EIO_WRITE: req->result = req->offs >= 0 2320 case EIO_WRITE: req->result = req->offs >= 0
2091 : write (req->int1, req->ptr2, req->size); break; 2322 : write (req->int1, req->ptr2, req->size); break;
2092 2323
2093 case EIO_READAHEAD: req->result = readahead (req->int1, req->offs, req->size); break; 2324 case EIO_READAHEAD: req->result = readahead (req->int1, req->offs, req->size); break;
2094 case EIO_SENDFILE: req->result = eio__sendfile (req->int1, req->int2, req->offs, req->size); break; 2325 case EIO_SENDFILE: req->result = eio__sendfile (req->int1, req->int2, req->offs, req->size); break;
2095 2326
2327#if HAVE_AT
2328
2096 case EIO_STAT: ALLOC (sizeof (EIO_STRUCT_STAT)); 2329 case EIO_STAT: ALLOC (sizeof (EIO_STRUCT_STAT));
2097 req->result = stat (req->ptr1, (EIO_STRUCT_STAT *)req->ptr2); break; 2330 req->result = fstatat (dirfd, req->ptr1, (EIO_STRUCT_STAT *)req->ptr2, 0); break;
2098 case EIO_LSTAT: ALLOC (sizeof (EIO_STRUCT_STAT)); 2331 case EIO_LSTAT: ALLOC (sizeof (EIO_STRUCT_STAT));
2332 req->result = fstatat (dirfd, req->ptr1, (EIO_STRUCT_STAT *)req->ptr2, AT_SYMLINK_NOFOLLOW); break;
2333 case EIO_CHOWN: req->result = fchownat (dirfd, req->ptr1, req->int2, req->int3, 0); break;
2334 case EIO_CHMOD: req->result = fchmodat (dirfd, req->ptr1, (mode_t)req->int2, 0); break;
2335 case EIO_TRUNCATE: req->result = eio__truncateat (dirfd, req->ptr1, req->offs); break;
2336 case EIO_OPEN: req->result = openat (dirfd, req->ptr1, req->int1, (mode_t)req->int2); break;
2337
2338 case EIO_UNLINK: req->result = unlinkat (dirfd, req->ptr1, 0); break;
2339 case EIO_RMDIR: /* complications arise because "." cannot be removed, so we might have to expand */
2340 req->result = req->wd && SINGLEDOT (req->ptr1)
2341 ? rmdir (req->wd->str)
2342 : unlinkat (dirfd, req->ptr1, AT_REMOVEDIR); break;
2343 case EIO_MKDIR: req->result = mkdirat (dirfd, req->ptr1, (mode_t)req->int2); break;
2344 case EIO_RENAME: /* complications arise because "." cannot be renamed, so we might have to expand */
2345 req->result = req->wd && SINGLEDOT (req->ptr1)
2346 ? rename (req->wd->str, req->ptr2)
2347 : renameat (dirfd, req->ptr1, WD2FD ((eio_wd)req->int3), req->ptr2); break;
2348 case EIO_LINK: req->result = linkat (dirfd, req->ptr1, WD2FD ((eio_wd)req->int3), req->ptr2, 0); break;
2349 case EIO_SYMLINK: req->result = symlinkat (req->ptr1, dirfd, req->ptr2); break;
2350 case EIO_MKNOD: req->result = mknodat (dirfd, req->ptr1, (mode_t)req->int2, (dev_t)req->offs); break;
2351 case EIO_READLINK: ALLOC (PATH_MAX);
2352 req->result = readlinkat (dirfd, req->ptr1, req->ptr2, PATH_MAX); break;
2353 case EIO_STATVFS: ALLOC (sizeof (EIO_STRUCT_STATVFS));
2354 req->result = eio__statvfsat (dirfd, req->ptr1, (EIO_STRUCT_STATVFS *)req->ptr2); break;
2355 case EIO_UTIME:
2356 case EIO_FUTIME:
2357 {
2358 struct timespec ts[2];
2359 struct timespec *times;
2360
2361 if (req->nv1 != -1. || req->nv2 != -1.)
2362 {
2363 ts[0].tv_sec = req->nv1;
2364 ts[0].tv_nsec = (req->nv1 - ts[0].tv_sec) * 1e9;
2365 ts[1].tv_sec = req->nv2;
2366 ts[1].tv_nsec = (req->nv2 - ts[1].tv_sec) * 1e9;
2367
2368 times = ts;
2369 }
2370 else
2371 times = 0;
2372
2373 req->result = req->type == EIO_FUTIME
2374 ? futimens (req->int1, times)
2375 : utimensat (dirfd, req->ptr1, times, 0);
2376 }
2377 break;
2378
2379#else
2380
2381 case EIO_STAT: ALLOC (sizeof (EIO_STRUCT_STAT));
2382 req->result = stat (path , (EIO_STRUCT_STAT *)req->ptr2); break;
2383 case EIO_LSTAT: ALLOC (sizeof (EIO_STRUCT_STAT));
2099 req->result = lstat (req->ptr1, (EIO_STRUCT_STAT *)req->ptr2); break; 2384 req->result = lstat (path , (EIO_STRUCT_STAT *)req->ptr2); break;
2385 case EIO_CHOWN: req->result = chown (path , req->int2, req->int3); break;
2386 case EIO_CHMOD: req->result = chmod (path , (mode_t)req->int2); break;
2387 case EIO_TRUNCATE: req->result = truncate (path , req->offs); break;
2388 case EIO_OPEN: req->result = open (path , req->int1, (mode_t)req->int2); break;
2389
2390 case EIO_UNLINK: req->result = unlink (path ); break;
2391 case EIO_RMDIR: req->result = rmdir (path ); break;
2392 case EIO_MKDIR: req->result = mkdir (path , (mode_t)req->int2); break;
2393 case EIO_RENAME: req->result = rename (path , req->ptr2); break;
2394 case EIO_LINK: req->result = link (path , req->ptr2); break;
2395 case EIO_SYMLINK: req->result = symlink (path , req->ptr2); break;
2396 case EIO_MKNOD: req->result = mknod (path , (mode_t)req->int2, (dev_t)req->offs); break;
2397 case EIO_READLINK: ALLOC (PATH_MAX);
2398 req->result = readlink (path, req->ptr2, PATH_MAX); break;
2399 case EIO_STATVFS: ALLOC (sizeof (EIO_STRUCT_STATVFS));
2400 req->result = statvfs (path , (EIO_STRUCT_STATVFS *)req->ptr2); break;
2401
2402 case EIO_UTIME:
2403 case EIO_FUTIME:
2404 {
2405 struct timeval tv[2];
2406 struct timeval *times;
2407
2408 if (req->nv1 != -1. || req->nv2 != -1.)
2409 {
2410 tv[0].tv_sec = req->nv1;
2411 tv[0].tv_usec = (req->nv1 - tv[0].tv_sec) * 1e6;
2412 tv[1].tv_sec = req->nv2;
2413 tv[1].tv_usec = (req->nv2 - tv[1].tv_sec) * 1e6;
2414
2415 times = tv;
2416 }
2417 else
2418 times = 0;
2419
2420 req->result = req->type == EIO_FUTIME
2421 ? futimes (req->int1, times)
2422 : utimes (req->ptr1, times);
2423 }
2424 break;
2425
2426#endif
2427
2428 case EIO_REALPATH: if (0 <= (req->result = eio__realpath (&self->tmpbuf, req->wd, req->ptr1)))
2429 {
2430 ALLOC (req->result);
2431 memcpy (req->ptr2, self->tmpbuf.ptr, req->result);
2432 }
2433 break;
2434
2100 case EIO_FSTAT: ALLOC (sizeof (EIO_STRUCT_STAT)); 2435 case EIO_FSTAT: ALLOC (sizeof (EIO_STRUCT_STAT));
2101 req->result = fstat (req->int1, (EIO_STRUCT_STAT *)req->ptr2); break; 2436 req->result = fstat (req->int1, (EIO_STRUCT_STAT *)req->ptr2); break;
2102 2437
2103 case EIO_STATVFS: ALLOC (sizeof (EIO_STRUCT_STATVFS));
2104 req->result = statvfs (req->ptr1, (EIO_STRUCT_STATVFS *)req->ptr2); break;
2105 case EIO_FSTATVFS: ALLOC (sizeof (EIO_STRUCT_STATVFS)); 2438 case EIO_FSTATVFS: ALLOC (sizeof (EIO_STRUCT_STATVFS));
2106 req->result = fstatvfs (req->int1, (EIO_STRUCT_STATVFS *)req->ptr2); break; 2439 req->result = fstatvfs (req->int1, (EIO_STRUCT_STATVFS *)req->ptr2); break;
2107 2440
2108 case EIO_CHOWN: req->result = chown (req->ptr1, req->int2, req->int3); break;
2109 case EIO_FCHOWN: req->result = fchown (req->int1, req->int2, req->int3); break; 2441 case EIO_FCHOWN: req->result = fchown (req->int1, req->int2, req->int3); break;
2110 case EIO_CHMOD: req->result = chmod (req->ptr1, (mode_t)req->int2); break;
2111 case EIO_FCHMOD: req->result = fchmod (req->int1, (mode_t)req->int2); break; 2442 case EIO_FCHMOD: req->result = fchmod (req->int1, (mode_t)req->int2); break;
2112 case EIO_TRUNCATE: req->result = truncate (req->ptr1, req->offs); break;
2113 case EIO_FTRUNCATE: req->result = ftruncate (req->int1, req->offs); break; 2443 case EIO_FTRUNCATE: req->result = ftruncate (req->int1, req->offs); break;
2114 2444
2115 case EIO_OPEN: req->result = open (req->ptr1, req->int1, (mode_t)req->int2); break;
2116 case EIO_CLOSE: req->result = close (req->int1); break; 2445 case EIO_CLOSE: req->result = close (req->int1); break;
2117 case EIO_DUP2: req->result = dup2 (req->int1, req->int2); break; 2446 case EIO_DUP2: req->result = dup2 (req->int1, req->int2); break;
2118 case EIO_UNLINK: req->result = unlink (req->ptr1); break;
2119 case EIO_RMDIR: req->result = rmdir (req->ptr1); break;
2120 case EIO_MKDIR: req->result = mkdir (req->ptr1, (mode_t)req->int2); break;
2121 case EIO_RENAME: req->result = rename (req->ptr1, req->ptr2); break;
2122 case EIO_LINK: req->result = link (req->ptr1, req->ptr2); break;
2123 case EIO_SYMLINK: req->result = symlink (req->ptr1, req->ptr2); break;
2124 case EIO_MKNOD: req->result = mknod (req->ptr1, (mode_t)req->int2, (dev_t)req->offs); break;
2125
2126 case EIO_REALPATH: eio__realpath (req, self); break;
2127
2128 case EIO_READLINK: ALLOC (PATH_MAX);
2129 req->result = readlink (req->ptr1, req->ptr2, PATH_MAX); break;
2130
2131 case EIO_SYNC: req->result = 0; sync (); break; 2447 case EIO_SYNC: req->result = 0; sync (); break;
2132 case EIO_FSYNC: req->result = fsync (req->int1); break; 2448 case EIO_FSYNC: req->result = fsync (req->int1); break;
2133 case EIO_FDATASYNC: req->result = fdatasync (req->int1); break; 2449 case EIO_FDATASYNC: req->result = fdatasync (req->int1); break;
2134 case EIO_SYNCFS: req->result = eio__syncfs (req->int1); break; 2450 case EIO_SYNCFS: req->result = eio__syncfs (req->int1); break;
2135 case EIO_SYNC_FILE_RANGE: req->result = eio__sync_file_range (req->int1, req->offs, req->size, req->int2); break; 2451 case EIO_SYNC_FILE_RANGE: req->result = eio__sync_file_range (req->int1, req->offs, req->size, req->int2); break;
2154 req->result = select (0, 0, 0, 0, &tv); 2470 req->result = select (0, 0, 0, 0, &tv);
2155 } 2471 }
2156#endif 2472#endif
2157 break; 2473 break;
2158 2474
2159 case EIO_UTIME:
2160 case EIO_FUTIME:
2161 {
2162 struct timeval tv[2];
2163 struct timeval *times;
2164
2165 if (req->nv1 != -1. || req->nv2 != -1.)
2166 {
2167 tv[0].tv_sec = req->nv1;
2168 tv[0].tv_usec = (req->nv1 - tv[0].tv_sec) * 1000000.;
2169 tv[1].tv_sec = req->nv2;
2170 tv[1].tv_usec = (req->nv2 - tv[1].tv_sec) * 1000000.;
2171
2172 times = tv;
2173 }
2174 else
2175 times = 0;
2176
2177 req->result = req->type == EIO_FUTIME
2178 ? futimes (req->int1, times)
2179 : utimes (req->ptr1, times);
2180 }
2181 break;
2182
2183 case EIO_GROUP: 2475 case EIO_GROUP:
2184 abort (); /* handled in eio_request */ 2476 abort (); /* handled in eio_request */
2185 2477
2186 case EIO_NOP: 2478 case EIO_NOP:
2187 req->result = 0; 2479 req->result = 0;
2190 case EIO_CUSTOM: 2482 case EIO_CUSTOM:
2191 req->feed (req); 2483 req->feed (req);
2192 break; 2484 break;
2193 2485
2194 default: 2486 default:
2195 errno = ENOSYS;
2196 req->result = -1; 2487 req->result = EIO_ENOSYS ();
2197 break; 2488 break;
2198 } 2489 }
2199 2490
2200 req->errorno = errno; 2491 req->errorno = errno;
2201} 2492}
2202 2493
2203#ifndef EIO_NO_WRAPPERS 2494#ifndef EIO_NO_WRAPPERS
2204 2495
/*
 * Asynchronous wrapper that builds an EIO_WD_OPEN request for path.
 * When such a request is executed, eio_execute calls eio__wd_open_sync
 * and stores the outcome in req->wd; req->result becomes -1 if that is
 * EIO_INVALID_WD and 0 otherwise.
 * pri, cb and data are presumably consumed by the REQ/PATH/SEND macros,
 * which are not fully visible here -- TODO confirm.
 */
2496eio_req *eio_wd_open (const char *path, int pri, eio_cb cb, void *data)
2497{
2498 REQ (EIO_WD_OPEN); PATH; SEND;
2499}
2500
/*
 * Asynchronous wrapper that builds an EIO_WD_CLOSE request carrying wd in
 * req->wd. When such a request is executed, eio_execute sets req->result
 * to 0 and passes req->wd to eio_wd_close_sync.
 * pri, cb and data are presumably consumed by the REQ/SEND macros, which
 * are not fully visible here -- TODO confirm.
 */
2501eio_req *eio_wd_close (eio_wd wd, int pri, eio_cb cb, void *data)
2502{
2503 REQ (EIO_WD_CLOSE); req->wd = wd; SEND;
2504}
2505
2205eio_req *eio_nop (int pri, eio_cb cb, void *data) 2506eio_req *eio_nop (int pri, eio_cb cb, void *data)
2206{ 2507{
2207 REQ (EIO_NOP); SEND; 2508 REQ (EIO_NOP); SEND;
2208} 2509}
2209 2510
2268} 2569}
2269 2570
2270eio_req *eio_readahead (int fd, off_t offset, size_t length, int pri, eio_cb cb, void *data) 2571eio_req *eio_readahead (int fd, off_t offset, size_t length, int pri, eio_cb cb, void *data)
2271{ 2572{
2272 REQ (EIO_READAHEAD); req->int1 = fd; req->offs = offset; req->size = length; SEND; 2573 REQ (EIO_READAHEAD); req->int1 = fd; req->offs = offset; req->size = length; SEND;
2574}
2575
2576eio_req *eio_seek (int fd, off_t offset, int whence, int pri, eio_cb cb, void *data)
2577{
2578 REQ (EIO_SEEK); req->int1 = fd; req->offs = offset; req->int2 = whence; SEND;
2273} 2579}
2274 2580
2275eio_req *eio_read (int fd, void *buf, size_t length, off_t offset, int pri, eio_cb cb, void *data) 2581eio_req *eio_read (int fd, void *buf, size_t length, off_t offset, int pri, eio_cb cb, void *data)
2276{ 2582{
2277 REQ (EIO_READ); req->int1 = fd; req->offs = offset; req->size = length; req->ptr2 = buf; SEND; 2583 REQ (EIO_READ); req->int1 = fd; req->offs = offset; req->size = length; req->ptr2 = buf; SEND;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines