ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/libeio/eio.c
(Generate patch)

Comparing libeio/eio.c (file contents):
Revision 1.27 by root, Wed Oct 22 18:15:36 2008 UTC vs.
Revision 1.38 by root, Fri Jun 12 20:01:42 2009 UTC

1/* 1/*
2 * libeio implementation 2 * libeio implementation
3 * 3 *
4 * Copyright (c) 2007,2008 Marc Alexander Lehmann <libeio@schmorp.de> 4 * Copyright (c) 2007,2008,2009 Marc Alexander Lehmann <libeio@schmorp.de>
5 * All rights reserved. 5 * All rights reserved.
6 * 6 *
7 * Redistribution and use in source and binary forms, with or without modifica- 7 * Redistribution and use in source and binary forms, with or without modifica-
8 * tion, are permitted provided that the following conditions are met: 8 * tion, are permitted provided that the following conditions are met:
9 * 9 *
36 * provisions above, a recipient may use your version of this file under 36 * provisions above, a recipient may use your version of this file under
37 * either the BSD or the GPL. 37 * either the BSD or the GPL.
38 */ 38 */
39 39
40#include "eio.h" 40#include "eio.h"
41
42#ifdef EIO_STACKSIZE
43# define XTHREAD_STACKSIZE EIO_STACKSIZE
44#endif
41#include "xthread.h" 45#include "xthread.h"
42 46
43#include <errno.h> 47#include <errno.h>
44#include <stddef.h> 48#include <stddef.h>
45#include <stdlib.h> 49#include <stdlib.h>
64#endif 68#endif
65 69
66#ifdef _WIN32 70#ifdef _WIN32
67 71
68 /*doh*/ 72 /*doh*/
69
70#else 73#else
71 74
72# include "config.h" 75# include "config.h"
73# include <sys/time.h> 76# include <sys/time.h>
74# include <sys/select.h> 77# include <sys/select.h>
78# include <sys/mman.h>
75# include <unistd.h> 79# include <unistd.h>
76# include <utime.h> 80# include <utime.h>
77# include <signal.h> 81# include <signal.h>
78# include <dirent.h> 82# include <dirent.h>
83
84/* POSIX_SOURCE is useless on bsd's, and XOPEN_SOURCE is unreliable there, too */
85# if defined(__FreeBSD__) || defined(__NetBSD__) || defined(__OpenBSD__)
86# define _DIRENT_HAVE_D_TYPE /* sigh */
87# define D_INO(de) (de)->d_fileno
88# define D_NAMLEN(de) (de)->d_namlen
89# elif defined(__linux) || defined(d_ino) || _XOPEN_SOURCE >= 600
90# define D_INO(de) (de)->d_ino
91# endif
92
93#ifdef _D_EXACT_NAMLEN
94# undef D_NAMLEN
95# define D_NAMLEN(de) _D_EXACT_NAMLEN (de)
96#endif
97
98# ifdef _DIRENT_HAVE_D_TYPE
99# define D_TYPE(de) (de)->d_type
100# endif
79 101
80# ifndef EIO_STRUCT_DIRENT 102# ifndef EIO_STRUCT_DIRENT
81# define EIO_STRUCT_DIRENT struct dirent 103# define EIO_STRUCT_DIRENT struct dirent
82# endif 104# endif
83 105
96# else 118# else
97# error sendfile support requested but not available 119# error sendfile support requested but not available
98# endif 120# endif
99#endif 121#endif
100 122
123#ifndef D_TYPE
124# define D_TYPE(de) 0
125#endif
126#ifndef D_INO
127# define D_INO(de) 0
128#endif
129#ifndef D_NAMLEN
130# define D_NAMLEN(de) strlen ((de)->d_name)
131#endif
132
101/* number of seconds after which an idle thread exits */ 133/* number of seconds after which an idle thread exits */
102#define IDLE_TIMEOUT 10 134#define IDLE_TIMEOUT 10
103 135
104/* used for struct dirent, AIX doesn't provide it */ 136/* used for struct dirent, AIX doesn't provide it */
105#ifndef NAME_MAX 137#ifndef NAME_MAX
155 if (wrk->dirp) \ 187 if (wrk->dirp) \
156 { \ 188 { \
157 closedir (wrk->dirp); \ 189 closedir (wrk->dirp); \
158 wrk->dirp = 0; \ 190 wrk->dirp = 0; \
159 } 191 }
192
160#define ETP_WORKER_COMMON \ 193#define ETP_WORKER_COMMON \
161 void *dbuf; \ 194 void *dbuf; \
162 DIR *dirp; 195 DIR *dirp;
163 196
164/*****************************************************************************/ 197/*****************************************************************************/
767 800
768 X_LOCK (preadwritelock); 801 X_LOCK (preadwritelock);
769 ooffset = lseek (fd, 0, SEEK_CUR); 802 ooffset = lseek (fd, 0, SEEK_CUR);
770 lseek (fd, offset, SEEK_SET); 803 lseek (fd, offset, SEEK_SET);
771 res = write (fd, buf, count); 804 res = write (fd, buf, count);
772 lseek (fd, offset, SEEK_SET); 805 lseek (fd, ooffset, SEEK_SET);
773 X_UNLOCK (preadwritelock); 806 X_UNLOCK (preadwritelock);
774 807
775 return res; 808 return res;
776} 809}
777#endif 810#endif
829 | (flags & EIO_SYNC_FILE_RANGE_WAIT_AFTER ? SYNC_FILE_RANGE_WAIT_AFTER : 0); 862 | (flags & EIO_SYNC_FILE_RANGE_WAIT_AFTER ? SYNC_FILE_RANGE_WAIT_AFTER : 0);
830 } 863 }
831 864
832 res = sync_file_range (fd, offset, nbytes, flags); 865 res = sync_file_range (fd, offset, nbytes, flags);
833 866
834 if (res != ENOSYS) 867 if (!res || errno != ENOSYS)
835 return res; 868 return res;
836#endif 869#endif
837 870
838 /* even though we could play tricks with the flags, it's better to always 871 /* even though we could play tricks with the flags, it's better to always
839 * call fdatasync, as that matches the expectation of its users best */ 872 * call fdatasync, as that matches the expectation of its users best */
957 } 990 }
958 991
959 return res; 992 return res;
960} 993}
961 994
995static signed char
996eio_dent_cmp (const eio_dirent *a, const eio_dirent *b)
997{
998 return b->score - a->score ? b->score - a->score /* works because our signed char is always 0..100 */
999 : a->inode < b->inode ? -1 : a->inode > b->inode ? 1 : 0;
1000}
1001
1002#define EIO_QSORT_CUTOFF 20 /* quite high, but performs well on many filesystems */
1003
1004static void
1005eio_dent_sort (eio_dirent *dents, int size)
1006{
1007 int i, j;
1008
1009 if (size > EIO_QSORT_CUTOFF * 3) /* skip quicksort for small directories */
1010 {
1011 /* first, use quicksort */
1012 /* should be good for 2**31 entries */
1013 struct rng { int l, r; } rng [32];
1014
1015 i = 0;
1016 rng[0].l = 0;
1017 rng[0].r = size;
1018
1019 while (expect_true (i >= 0))
1020 {
1021 int L = rng [i].l;
1022 int R = rng [i].r - 1;
1023
1024 if (expect_false (L + EIO_QSORT_CUTOFF < R))
1025 {
1026 eio_dirent piv = dents [L];
1027
1028 while (L < R)
1029 {
1030 while (eio_dent_cmp (&dents [R], &piv) >= 0 && L < R)
1031 --R;
1032
1033 if (L < R)
1034 dents [L++] = dents [R];
1035
1036 while (eio_dent_cmp (&dents [L], &piv) <= 0 && L < R)
1037 ++L;
1038
1039 if (L < R)
1040 dents [R--] = dents [L];
1041 }
1042
1043 dents [L] = piv;
1044
1045 ++i;
1046 rng [i].l = L + 1;
1047 rng [i].r = rng [i - 1].r;
1048 rng [i - 1].r = L;
1049
1050 if (rng [i].r - rng [i].l > rng [i - 1].r - rng [i - 1].l)
1051 {
1052 struct rng t;
1053
1054 t = rng [i]; rng [i] = rng [i - 1]; rng [i - 1] = t;
1055 }
1056 }
1057 else
1058 --i;
1059 }
1060 }
1061
1062 /* use a simple insertion sort at the end */
1063 for (i = 1; i < size; ++i)
1064 {
1065 eio_dirent value = dents [i];
1066
1067 for (j = i - 1; j >= 0 && eio_dent_cmp (&dents [j], &value) > 0; --j)
1068 dents [j + 1] = dents [j];
1069
1070 dents [j + 1] = value;
1071 }
1072}
1073
962/* read a full directory */ 1074/* read a full directory */
963static void 1075static void
964eio__scandir (eio_req *req, etp_worker *self) 1076eio__scandir (eio_req *req, etp_worker *self)
965{ 1077{
966 DIR *dirp; 1078 DIR *dirp;
967 EIO_STRUCT_DIRENT *entp; 1079 EIO_STRUCT_DIRENT *entp;
968 char *name, *names; 1080 char *name, *names;
969 int memlen = 4096; 1081 int namesalloc = 4096;
970 int memofs = 0; 1082 int namesoffs = 0;
1083 int flags = req->int1;
1084 eio_dirent *dents = 0;
1085 int dentalloc = 128;
971 int res = 0; 1086 int dentoffs = 0;
1087
1088 req->result = -1;
1089
1090 if (!(flags & EIO_READDIR_DENTS))
1091 flags &= ~(EIO_READDIR_DIRS_FIRST | EIO_READDIR_STAT_ORDER);
972 1092
973 X_LOCK (wrklock); 1093 X_LOCK (wrklock);
974 /* the corresponding closedir is in ETP_WORKER_CLEAR */ 1094 /* the corresponding closedir is in ETP_WORKER_CLEAR */
975 self->dirp = dirp = opendir (req->ptr1); 1095 self->dirp = dirp = opendir (req->ptr1);
976 req->flags |= EIO_FLAG_PTR2_FREE; 1096 req->flags |= EIO_FLAG_PTR1_FREE | EIO_FLAG_PTR2_FREE;
977 req->ptr2 = names = malloc (memlen); 1097 req->ptr1 = names = malloc (namesalloc);
1098 req->ptr2 = dents = flags ? malloc (dentalloc * sizeof (eio_dirent)) : 0;
978 X_UNLOCK (wrklock); 1099 X_UNLOCK (wrklock);
979 1100
980 if (dirp && names) 1101 if (dirp && names && (!flags || dents))
981 for (;;) 1102 for (;;)
982 { 1103 {
983 errno = 0; 1104 errno = 0;
984 entp = readdir (dirp); 1105 entp = readdir (dirp);
985 1106
986 if (!entp) 1107 if (!entp)
1108 {
1109 if (errno)
1110 break;
1111
1112 /* sort etc. */
1113 req->int1 = flags;
1114 req->result = dentoffs;
1115
1116 if (dents)
1117 {
1118 eio_dirent *ent = dents + dentoffs;
1119
1120 while (ent > dents)
1121 (--ent)->name = names + (size_t)ent->name;
1122 }
1123
1124 if (flags & EIO_READDIR_STAT_ORDER
1125 || !(~flags & (EIO_READDIR_DIRS_FIRST | EIO_READDIR_FOUND_UNKNOWN)))
1126 eio_dent_sort (dents, dentoffs); /* score depends on DIRS_FIRST */
1127 else if (flags & EIO_READDIR_DIRS_FIRST)
1128 {
1129 /* in this case, all is known, and we just put dirs first and sort them */
1130 eio_dirent *ent = dents + dentoffs;
1131 eio_dirent *dir = dents;
1132
1133 /* now move dirs to the front, and non-dirs to the back */
1134 /* by walking from both sides and swapping if necessary */
1135 while (ent > dir)
1136 {
1137 if (dir->type == DT_DIR)
1138 ++dir;
1139 else
1140 {
1141 --ent;
1142
1143 if (ent->type == DT_DIR)
1144 {
1145 eio_dirent tmp = *dir;
1146 *dir = *ent;
1147 *ent = tmp;
1148
1149 ++dir;
1150 }
1151 }
1152 }
1153
1154 /* now sort the dirs only */
1155 eio_dent_sort (dents, dir - dents);
1156 }
1157
1158 /* only provide the names array unless DENTS is specified */
1159 if (!(flags & EIO_READDIR_DENTS))
1160 {
1161 X_LOCK (wrklock);
1162 assert (!dents);
1163 req->ptr1 = 0;
1164 req->ptr2 = names;
1165 X_UNLOCK (wrklock);
1166 }
1167
987 break; 1168 break;
1169 }
988 1170
1171 /* now add the entry to our list(s) */
989 name = entp->d_name; 1172 name = entp->d_name;
990 1173
1174 /* skip . and .. entries */
991 if (name [0] != '.' || (name [1] && (name [1] != '.' || name [2]))) 1175 if (name [0] != '.' || (name [1] && (name [1] != '.' || name [2])))
992 { 1176 {
993 int len = strlen (name) + 1; 1177 int len = D_NAMLEN (entp) + 1;
994 1178
995 res++; 1179 while (expect_false (namesoffs + len > namesalloc))
996
997 while (memofs + len > memlen)
998 { 1180 {
999 memlen *= 2; 1181 namesalloc *= 2;
1000 X_LOCK (wrklock); 1182 X_LOCK (wrklock);
1001 req->ptr2 = names = realloc (names, memlen); 1183 req->ptr1 = names = realloc (names, namesalloc);
1002 X_UNLOCK (wrklock); 1184 X_UNLOCK (wrklock);
1003 1185
1004 if (!names) 1186 if (!names)
1005 break; 1187 break;
1006 } 1188 }
1007 1189
1008 memcpy (names + memofs, name, len); 1190 memcpy (names + namesoffs, name, len);
1191
1192 if (dents)
1193 {
1194 struct eio_dirent *ent;
1195
1196 if (expect_false (dentoffs == dentalloc))
1197 {
1198 dentalloc *= 2;
1199 X_LOCK (wrklock);
1200 req->ptr2 = dents = realloc (dents, dentalloc * sizeof (eio_dirent));
1201 X_UNLOCK (wrklock);
1202
1203 if (!dents)
1204 break;
1205 }
1206
1207 ent = dents + dentoffs;
1208
1209 ent->name = (char *)(size_t)namesoffs; /* rather dirtily we store the offset in the pointer */
1210 ent->namelen = len - 1;
1211 ent->inode = D_INO (entp);
1212
1213 switch (D_TYPE (entp))
1214 {
1215 default:
1216 ent->type = EIO_DT_UNKNOWN;
1217 flags |= EIO_READDIR_FOUND_UNKNOWN;
1218 break;
1219
1220 #ifdef DT_FIFO
1221 case DT_FIFO: ent->type = EIO_DT_FIFO; break;
1222 #endif
1223 #ifdef DT_CHR
1224 case DT_CHR: ent->type = EIO_DT_CHR; break;
1225 #endif
1226 #ifdef DT_MPC
1227 case DT_MPC: ent->type = EIO_DT_MPC; break;
1228 #endif
1229 #ifdef DT_DIR
1230 case DT_DIR: ent->type = EIO_DT_DIR; break;
1231 #endif
1232 #ifdef DT_NAM
1233 case DT_NAM: ent->type = EIO_DT_NAM; break;
1234 #endif
1235 #ifdef DT_BLK
1236 case DT_BLK: ent->type = EIO_DT_BLK; break;
1237 #endif
1238 #ifdef DT_MPB
1239 case DT_MPB: ent->type = EIO_DT_MPB; break;
1240 #endif
1241 #ifdef DT_REG
1242 case DT_REG: ent->type = EIO_DT_REG; break;
1243 #endif
1244 #ifdef DT_NWK
1245 case DT_NWK: ent->type = EIO_DT_NWK; break;
1246 #endif
1247 #ifdef DT_CMP
1248 case DT_CMP: ent->type = EIO_DT_CMP; break;
1249 #endif
1250 #ifdef DT_LNK
1251 case DT_LNK: ent->type = EIO_DT_LNK; break;
1252 #endif
1253 #ifdef DT_SOCK
1254 case DT_SOCK: ent->type = EIO_DT_SOCK; break;
1255 #endif
1256 #ifdef DT_DOOR
1257 case DT_DOOR: ent->type = EIO_DT_DOOR; break;
1258 #endif
1259 #ifdef DT_WHT
1260 case DT_WHT: ent->type = EIO_DT_WHT; break;
1261 #endif
1262 }
1263
1264 ent->score = 0;
1265
1266 if (flags & EIO_READDIR_DIRS_FIRST)
1267 {
1268 if (ent->type == EIO_DT_UNKNOWN)
1269 {
1270 if (*name == '.') /* leading dots are likely directories, and, in any case, rare */
1271 ent->score = 98;
1272 else if (!strchr (name, '.')) /* absence of dots indicates likely dirs */
1273 ent->score = len <= 2 ? len + 6 : len <= 4 ? 5 : len <= 7 ? 4 : 1; /* shorter == more likely dir, but avoid too many classes */
1274 }
1275 else if (ent->type == EIO_DT_DIR)
1276 ent->score = 100;
1277 }
1278 }
1279
1009 memofs += len; 1280 namesoffs += len;
1281 ++dentoffs;
1282 }
1283
1284 if (EIO_CANCELLED (req))
1285 {
1286 errno = ECANCELED;
1287 break;
1010 } 1288 }
1011 } 1289 }
1012
1013 if (errno)
1014 res = -1;
1015
1016 req->result = res;
1017} 1290}
1018 1291
1019#if !(_POSIX_MAPPED_FILES && _POSIX_SYNCHRONIZED_IO) 1292#if !(_POSIX_MAPPED_FILES && _POSIX_SYNCHRONIZED_IO)
1020# undef msync 1293# undef msync
1021# define msync(a,b,c) ENOSYS 1294# define msync(a,b,c) ((errno = ENOSYS), -1)
1022#endif 1295#endif
1023 1296
1024int 1297int
1025eio__mtouch (void *mem, size_t len, int flags) 1298eio__mtouch (void *mem, size_t len, int flags)
1026{ 1299{
1441eio_req *eio_rmdir (const char *path, int pri, eio_cb cb, void *data) 1714eio_req *eio_rmdir (const char *path, int pri, eio_cb cb, void *data)
1442{ 1715{
1443 return eio__1path (EIO_RMDIR, path, pri, cb, data); 1716 return eio__1path (EIO_RMDIR, path, pri, cb, data);
1444} 1717}
1445 1718
1446eio_req *eio_readdir (const char *path, int pri, eio_cb cb, void *data) 1719eio_req *eio_readdir (const char *path, int flags, int pri, eio_cb cb, void *data)
1447{ 1720{
1448 return eio__1path (EIO_READDIR, path, pri, cb, data); 1721 REQ (EIO_READDIR); PATH; req->int1 = flags; SEND;
1449} 1722}
1450 1723
1451eio_req *eio_mknod (const char *path, mode_t mode, dev_t dev, int pri, eio_cb cb, void *data) 1724eio_req *eio_mknod (const char *path, mode_t mode, dev_t dev, int pri, eio_cb cb, void *data)
1452{ 1725{
1453 REQ (EIO_MKNOD); PATH; req->int2 = (long)mode; req->int3 = (long)dev; SEND; 1726 REQ (EIO_MKNOD); PATH; req->int2 = (long)mode; req->int3 = (long)dev; SEND;
1542/* misc garbage */ 1815/* misc garbage */
1543 1816
1544ssize_t eio_sendfile_sync (int ofd, int ifd, off_t offset, size_t count) 1817ssize_t eio_sendfile_sync (int ofd, int ifd, off_t offset, size_t count)
1545{ 1818{
1546 etp_worker wrk; 1819 etp_worker wrk;
1820 ssize_t ret;
1547 1821
1548 wrk.dbuf = 0; 1822 wrk.dbuf = 0;
1549 1823
1550 eio__sendfile (ofd, ifd, offset, count, &wrk); 1824 ret = eio__sendfile (ofd, ifd, offset, count, &wrk);
1551 1825
1552 if (wrk.dbuf) 1826 if (wrk.dbuf)
1553 free (wrk.dbuf); 1827 free (wrk.dbuf);
1554}
1555 1828
1829 return ret;
1830}
1831

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines