1 | /* |
1 | /* |
2 | * This file is part of Deliantra, the Roguelike Realtime MMORPG. |
2 | * This file is part of Deliantra, the Roguelike Realtime MMORPG. |
3 | * |
3 | * |
|
|
4 | * Copyright (©) 2017,2018 Marc Alexander Lehmann / the Deliantra team |
4 | * Copyright (©) 2005,2006,2007,2008 Marc Alexander Lehmann / Robin Redeker / the Deliantra team |
5 | * Copyright (©) 2005,2006,2007,2008,2009,2010,2011,2012,2013,2014,2015,2016 Marc Alexander Lehmann / Robin Redeker / the Deliantra team |
5 | * |
6 | * |
6 | * Deliantra is free software: you can redistribute it and/or modify |
7 | * Deliantra is free software: you can redistribute it and/or modify it under |
7 | * it under the terms of the GNU General Public License as published by |
8 | * the terms of the Affero GNU General Public License as published by the |
8 | * the Free Software Foundation, either version 3 of the License, or |
9 | * Free Software Foundation, either version 3 of the License, or (at your |
9 | * (at your option) any later version. |
10 | * option) any later version. |
10 | * |
11 | * |
11 | * This program is distributed in the hope that it will be useful, |
12 | * This program is distributed in the hope that it will be useful, |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
14 | * GNU General Public License for more details. |
15 | * GNU General Public License for more details. |
15 | * |
16 | * |
16 | * You should have received a copy of the GNU General Public License |
17 | * You should have received a copy of the Affero GNU General Public License |
17 | * along with this program. If not, see <http://www.gnu.org/licenses/>. |
18 | * and the GNU General Public License along with this program. If not, see |
|
|
19 | * <http://www.gnu.org/licenses/>. |
18 | * |
20 | * |
19 | * The authors can be reached via e-mail to <support@deliantra.net> |
21 | * The authors can be reached via e-mail to <support@deliantra.net> |
20 | */ |
22 | */ |
21 | |
23 | |
22 | #ifndef UTIL_H__ |
24 | #ifndef UTIL_H__ |
23 | #define UTIL_H__ |
25 | #define UTIL_H__ |
24 | |
26 | |
25 | #define DEBUG_POISON 0x00 // poison memory before freeing it if != 0 |
27 | #define DEBUG_POISON 0x00 // poison memory before freeing it if != 0 |
26 | #define DEBUG_SALLOC 0 // add a debug wrapper around all sallocs |
28 | #define DEBUG_SALLOC 0 // add a debug wrapper around all sallocs |
27 | #define PREFER_MALLOC 0 // use malloc and not the slice allocator |
29 | #define PREFER_MALLOC 0 // use malloc and not the slice allocator |
28 | |
|
|
29 | #if __GNUC__ >= 3 |
|
|
30 | # define is_constant(c) __builtin_constant_p (c) |
|
|
31 | # define expect(expr,value) __builtin_expect ((expr),(value)) |
|
|
32 | # define prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality) |
|
|
33 | # define noinline __attribute__((__noinline__)) |
|
|
34 | #else |
|
|
35 | # define is_constant(c) 0 |
|
|
36 | # define expect(expr,value) (expr) |
|
|
37 | # define prefetch(addr,rw,locality) |
|
|
38 | # define noinline |
|
|
39 | #endif |
|
|
40 | |
|
|
41 | #if __GNUC__ < 4 || (__GNUC__ == 4 || __GNUC_MINOR__ < 4) |
|
|
42 | # define decltype(x) typeof(x) |
|
|
43 | #endif |
|
|
44 | |
|
|
45 | // put into ifs if you are very sure that the expression |
|
|
46 | // is mostly true or mostly false. note that these return |
|
|
47 | // booleans, not the expression. |
|
|
48 | #define expect_false(expr) expect ((expr) ? 1 : 0, 0) |
|
|
49 | #define expect_true(expr) expect ((expr) ? 1 : 0, 1) |
|
|
50 | |
30 | |
51 | #include <pthread.h> |
31 | #include <pthread.h> |
52 | |
32 | |
53 | #include <cstddef> |
33 | #include <cstddef> |
54 | #include <cmath> |
34 | #include <cmath> |
55 | #include <new> |
35 | #include <new> |
56 | #include <vector> |
36 | #include <vector> |
57 | |
37 | |
58 | #include <glib.h> |
38 | #include <glib.h> |
59 | |
39 | |
|
|
40 | #include <flat_hash_map.hpp> |
|
|
41 | |
60 | #include <shstr.h> |
42 | #include <shstr.h> |
61 | #include <traits.h> |
43 | #include <traits.h> |
|
|
44 | |
|
|
45 | #include "ecb.h" |
62 | |
46 | |
63 | #if DEBUG_SALLOC |
47 | #if DEBUG_SALLOC |
64 | # define g_slice_alloc0(s) debug_slice_alloc0(s) |
48 | # define g_slice_alloc0(s) debug_slice_alloc0(s) |
65 | # define g_slice_alloc(s) debug_slice_alloc(s) |
49 | # define g_slice_alloc(s) debug_slice_alloc(s) |
66 | # define g_slice_free1(s,p) debug_slice_free1(s,p) |
50 | # define g_slice_free1(s,p) debug_slice_free1(s,p) |
… | |
… | |
71 | # define g_slice_alloc0(s) calloc (1, (s)) |
55 | # define g_slice_alloc0(s) calloc (1, (s)) |
72 | # define g_slice_alloc(s) malloc ((s)) |
56 | # define g_slice_alloc(s) malloc ((s)) |
73 | # define g_slice_free1(s,p) free ((p)) |
57 | # define g_slice_free1(s,p) free ((p)) |
74 | #endif |
58 | #endif |
75 | |
59 | |
76 | // use C0X decltype for auto declarations until ISO C++ sanctifies them (if ever) |
|
|
77 | #define auto(var,expr) decltype(expr) var = (expr) |
|
|
78 | |
|
|
79 | // very ugly macro that basically declares and initialises a variable |
60 | // very ugly macro that basically declares and initialises a variable |
80 | // that is in scope for the next statement only |
61 | // that is in scope for the next statement only |
81 | // works only for stuff that can be assigned 0 and converts to false |
62 | // works only for stuff that can be assigned 0 and converts to false |
82 | // (note: works great for pointers) |
63 | // (note: works great for pointers) |
83 | // most ugly macro I ever wrote |
64 | // most ugly macro I ever wrote |
… | |
… | |
89 | |
70 | |
90 | // in range excluding end |
71 | // in range excluding end |
91 | #define IN_RANGE_EXC(val,beg,end) \ |
72 | #define IN_RANGE_EXC(val,beg,end) \ |
92 | ((unsigned int)(val) - (unsigned int)(beg) < (unsigned int)(end) - (unsigned int)(beg)) |
73 | ((unsigned int)(val) - (unsigned int)(beg) < (unsigned int)(end) - (unsigned int)(beg)) |
93 | |
74 | |
94 | void cleanup (const char *cause, bool make_core = false); |
75 | ecb_cold void cleanup (const char *cause, bool make_core = false); |
95 | void fork_abort (const char *msg); |
76 | ecb_cold void fork_abort (const char *msg); |
96 | |
77 | |
97 | // rationale for using (U) not (T) is to reduce signed/unsigned issues, |
78 | // rationale for using (U) not (T) is to reduce signed/unsigned issues, |
98 | // as a is often a constant while b is the variable. it is still a bug, though. |
79 | // as a is often a constant while b is the variable. it is still a bug, though. |
99 | template<typename T, typename U> static inline T min (T a, U b) { return (U)a < b ? (U)a : b; } |
80 | template<typename T, typename U> static inline T min (T a, U b) { return a < (T)b ? a : (T)b; } |
100 | template<typename T, typename U> static inline T max (T a, U b) { return (U)a > b ? (U)a : b; } |
81 | template<typename T, typename U> static inline T max (T a, U b) { return a > (T)b ? a : (T)b; } |
101 | template<typename T, typename U, typename V> static inline T clamp (T v, U a, V b) { return v < (T)a ? (T)a : v >(T)b ? (T)b : v; } |
82 | template<typename T, typename U, typename V> static inline T clamp (T v, U a, V b) { return v < (T)a ? (T)a : v >(T)b ? (T)b : v; } |
102 | |
83 | |
103 | template<typename T, typename U> static inline void min_it (T &v, U m) { v = min (v, (T)m); } |
84 | template<typename T, typename U> static inline void min_it (T &v, U m) { v = min (v, (T)m); } |
104 | template<typename T, typename U> static inline void max_it (T &v, U m) { v = max (v, (T)m); } |
85 | template<typename T, typename U> static inline void max_it (T &v, U m) { v = max (v, (T)m); } |
105 | template<typename T, typename U, typename V> static inline void clamp_it (T &v, U a, V b) { v = clamp (v, (T)a, (T)b); } |
86 | template<typename T, typename U, typename V> static inline void clamp_it (T &v, U a, V b) { v = clamp (v, (T)a, (T)b); } |
… | |
… | |
112 | // sign returns -1 or +1 |
93 | // sign returns -1 or +1 |
113 | template<typename T> |
94 | template<typename T> |
114 | static inline T sign (T v) { return v < 0 ? -1 : +1; } |
95 | static inline T sign (T v) { return v < 0 ? -1 : +1; } |
115 | // relies on 2c representation |
96 | // relies on 2c representation |
116 | template<> |
97 | template<> |
117 | inline sint8 sign (sint8 v) { return 1 - (sint8 (uint8 (v) >> 7) * 2); } |
98 | inline sint8 sign (sint8 v) { return 1 - (sint8 (uint8 (v) >> 7) * 2); } |
|
|
99 | template<> |
|
|
100 | inline sint16 sign (sint16 v) { return 1 - (sint16 (uint16 (v) >> 15) * 2); } |
|
|
101 | template<> |
|
|
102 | inline sint32 sign (sint32 v) { return 1 - (sint32 (uint32 (v) >> 31) * 2); } |
118 | |
103 | |
119 | // sign0 returns -1, 0 or +1 |
104 | // sign0 returns -1, 0 or +1 |
120 | template<typename T> |
105 | template<typename T> |
121 | static inline T sign0 (T v) { return v ? sign (v) : 0; } |
106 | static inline T sign0 (T v) { return v ? sign (v) : 0; } |
122 | |
107 | |
|
|
108 | //clashes with C++0x |
|
|
109 | template<typename T, typename U> |
|
|
110 | static inline T copysign (T a, U b) { return a > 0 ? b : -b; } |
|
|
111 | |
|
|
112 | // div* only work correctly for div > 0 |
123 | // div, with correct rounding (< 0.5 downwards, >=0.5 upwards) |
113 | // div, with correct rounding (< 0.5 downwards, >=0.5 upwards) |
124 | template<typename T> static inline T div (T val, T div) { return (val + div / 2) / div; } |
114 | template<typename T> static inline T div (T val, T div) |
|
|
115 | { |
|
|
116 | return ecb_expect_false (val < 0) ? - ((-val + (div - 1) / 2) / div) : (val + div / 2) / div; |
|
|
117 | } |
|
|
118 | |
|
|
119 | template<> inline float div (float val, float div) { return val / div; } |
|
|
120 | template<> inline double div (double val, double div) { return val / div; } |
|
|
121 | |
125 | // div, round-up |
122 | // div, round-up |
126 | template<typename T> static inline T div_ru (T val, T div) { return (val + div - 1) / div; } |
123 | template<typename T> static inline T div_ru (T val, T div) |
|
|
124 | { |
|
|
125 | return ecb_expect_false (val < 0) ? - ((-val ) / div) : (val + div - 1) / div; |
|
|
126 | } |
127 | // div, round-down |
127 | // div, round-down |
128 | template<typename T> static inline T div_rd (T val, T div) { return (val ) / div; } |
128 | template<typename T> static inline T div_rd (T val, T div) |
|
|
129 | { |
|
|
130 | return ecb_expect_false (val < 0) ? - ((-val + (div - 1) ) / div) : (val ) / div; |
|
|
131 | } |
129 | |
132 | |
|
|
133 | // lerp* only work correctly for min_in < max_in |
|
|
134 | // Linear intERPolate, scales val from min_in..max_in to min_out..max_out |
130 | template<typename T> |
135 | template<typename T> |
131 | static inline T |
136 | static inline T |
132 | lerp (T val, T min_in, T max_in, T min_out, T max_out) |
137 | lerp (T val, T min_in, T max_in, T min_out, T max_out) |
133 | { |
138 | { |
134 | return min_out + div <T> ((val - min_in) * (max_out - min_out), max_in - min_in); |
139 | return min_out + div <T> ((val - min_in) * (max_out - min_out), max_in - min_in); |
… | |
… | |
193 | int32_t d = b - a; |
198 | int32_t d = b - a; |
194 | d &= d >> 31; |
199 | d &= d >> 31; |
195 | return b - d; |
200 | return b - d; |
196 | } |
201 | } |
197 | |
202 | |
198 | // this is much faster than crossfires original algorithm |
203 | // this is much faster than crossfire's original algorithm |
199 | // on modern cpus |
204 | // on modern cpus |
200 | inline int |
205 | inline int |
201 | isqrt (int n) |
206 | isqrt (int n) |
202 | { |
207 | { |
203 | return (int)sqrtf ((float)n); |
208 | return (int)sqrtf ((float)n); |
|
|
209 | } |
|
|
210 | |
|
|
211 | // this is kind of like the ^^ operator, if it existed, but without a sequence point. |
|
|
212 | // more handy than it looks like, due to the implicit !! done on its arguments |
|
|
213 | inline bool |
|
|
214 | logical_xor (bool a, bool b) |
|
|
215 | { |
|
|
216 | return a != b; |
|
|
217 | } |
|
|
218 | |
|
|
219 | inline bool |
|
|
220 | logical_implies (bool a, bool b) |
|
|
221 | { |
|
|
222 | return a <= b; |
204 | } |
223 | } |
205 | |
224 | |
206 | // this is only twice as fast as naive sqrtf (dx*dx+dy*dy) |
225 | // this is only twice as fast as naive sqrtf (dx*dx+dy*dy) |
207 | #if 0 |
226 | #if 0 |
208 | // and has a max. error of 6 in the range -100..+100. |
227 | // and has a max. error of 6 in the range -100..+100. |
209 | #else |
228 | #else |
210 | // and has a max. error of 9 in the range -100..+100. |
229 | // and has a max. error of 9 in the range -100..+100. |
211 | #endif |
230 | #endif |
212 | inline int |
231 | inline int |
213 | idistance (int dx, int dy) |
232 | idistance (int dx, int dy) |
214 | { |
233 | { |
215 | unsigned int dx_ = abs (dx); |
234 | unsigned int dx_ = abs (dx); |
216 | unsigned int dy_ = abs (dy); |
235 | unsigned int dy_ = abs (dy); |
217 | |
236 | |
218 | #if 0 |
237 | #if 0 |
219 | return dx_ > dy_ |
238 | return dx_ > dy_ |
… | |
… | |
222 | #else |
241 | #else |
223 | return dx_ + dy_ - min (dx_, dy_) * 5 / 8; |
242 | return dx_ + dy_ - min (dx_, dy_) * 5 / 8; |
224 | #endif |
243 | #endif |
225 | } |
244 | } |
226 | |
245 | |
|
|
246 | // can be substantially faster than floor, if your value range allows for it |
|
|
247 | template<typename T> |
|
|
248 | inline T |
|
|
249 | fastfloor (T x) |
|
|
250 | { |
|
|
251 | return std::floor (x); |
|
|
252 | } |
|
|
253 | |
|
|
254 | inline float |
|
|
255 | fastfloor (float x) |
|
|
256 | { |
|
|
257 | return sint32(x) - (x < 0); |
|
|
258 | } |
|
|
259 | |
|
|
260 | inline double |
|
|
261 | fastfloor (double x) |
|
|
262 | { |
|
|
263 | return sint64(x) - (x < 0); |
|
|
264 | } |
|
|
265 | |
227 | /* |
266 | /* |
228 | * absdir(int): Returns a number between 1 and 8, which represents |
267 | * absdir(int): Returns a number between 1 and 8, which represents |
229 | * the "absolute" direction of a number (it actually takes care of |
268 | * the "absolute" direction of a number (it actually takes care of |
230 | * "overflow" in previous calculations of a direction). |
269 | * "overflow" in previous calculations of a direction). |
231 | */ |
270 | */ |
… | |
… | |
233 | absdir (int d) |
272 | absdir (int d) |
234 | { |
273 | { |
235 | return ((d - 1) & 7) + 1; |
274 | return ((d - 1) & 7) + 1; |
236 | } |
275 | } |
237 | |
276 | |
|
|
277 | #define for_all_bits_sparse_32(mask, idxvar) \ |
|
|
278 | for (uint32_t idxvar, mask_ = mask; \ |
|
|
279 | mask_ && ((idxvar = ecb_ctz32 (mask_)), mask_ &= ~(1 << idxvar), 1);) |
|
|
280 | |
238 | extern ssize_t slice_alloc; // statistics |
281 | extern ssize_t slice_alloc; // statistics |
239 | |
282 | |
240 | void *salloc_ (int n) throw (std::bad_alloc); |
283 | void *salloc_ (int n) noexcept; |
241 | void *salloc_ (int n, void *src) throw (std::bad_alloc); |
284 | void *salloc_ (int n, void *src) noexcept; |
242 | |
285 | |
243 | // strictly the same as g_slice_alloc, but never returns 0 |
286 | // strictly the same as g_slice_alloc, but never returns 0 |
244 | template<typename T> |
287 | template<typename T> |
245 | inline T *salloc (int n = 1) throw (std::bad_alloc) { return (T *)salloc_ (n * sizeof (T)); } |
288 | inline T *salloc (int n = 1) { return (T *)salloc_ (n * sizeof (T)); } |
246 | |
289 | |
247 | // also copies src into the new area, like "memdup" |
290 | // also copies src into the new area, like "memdup" |
248 | // if src is 0, clears the memory |
291 | // if src is 0, clears the memory |
249 | template<typename T> |
292 | template<typename T> |
250 | inline T *salloc (int n, T *src) throw (std::bad_alloc) { return (T *)salloc_ (n * sizeof (T), (void *)src); } |
293 | inline T *salloc (int n, T *src) { return (T *)salloc_ (n * sizeof (T), (void *)src); } |
251 | |
294 | |
252 | // clears the memory |
295 | // clears the memory |
253 | template<typename T> |
296 | template<typename T> |
254 | inline T *salloc0(int n = 1) throw (std::bad_alloc) { return (T *)salloc_ (n * sizeof (T), 0); } |
297 | inline T *salloc0(int n = 1) { return (T *)salloc_ (n * sizeof (T), 0); } |
255 | |
298 | |
256 | // for symmetry |
299 | // for symmetry |
257 | template<typename T> |
300 | template<typename T> |
258 | inline void sfree (T *ptr, int n = 1) throw () |
301 | inline void sfree (T *ptr, int n = 1) noexcept |
259 | { |
302 | { |
260 | if (expect_true (ptr)) |
303 | if (ecb_expect_true (ptr)) |
261 | { |
304 | { |
262 | slice_alloc -= n * sizeof (T); |
305 | slice_alloc -= n * sizeof (T); |
263 | if (DEBUG_POISON) memset (ptr, DEBUG_POISON, n * sizeof (T)); |
306 | if (DEBUG_POISON) memset (ptr, DEBUG_POISON, n * sizeof (T)); |
264 | g_slice_free1 (n * sizeof (T), (void *)ptr); |
307 | g_slice_free1 (n * sizeof (T), (void *)ptr); |
265 | assert (slice_alloc >= 0);//D |
|
|
266 | } |
308 | } |
267 | } |
309 | } |
268 | |
310 | |
269 | // nulls the pointer |
311 | // nulls the pointer |
270 | template<typename T> |
312 | template<typename T> |
271 | inline void sfree0 (T *&ptr, int n = 1) throw () |
313 | inline void sfree0 (T *&ptr, int n = 1) noexcept |
272 | { |
314 | { |
273 | sfree<T> (ptr, n); |
315 | sfree<T> (ptr, n); |
274 | ptr = 0; |
316 | ptr = 0; |
275 | } |
317 | } |
276 | |
318 | |
… | |
… | |
332 | sfree ((char *)p, s); |
374 | sfree ((char *)p, s); |
333 | } |
375 | } |
334 | }; |
376 | }; |
335 | |
377 | |
336 | // a STL-compatible allocator that uses g_slice |
378 | // a STL-compatible allocator that uses g_slice |
337 | // boy, this is verbose |
379 | // boy, this is much less verbose in newer C++ versions |
338 | template<typename Tp> |
380 | template<typename Tp> |
339 | struct slice_allocator |
381 | struct slice_allocator |
340 | { |
382 | { |
341 | typedef size_t size_type; |
383 | using value_type = Tp; |
342 | typedef ptrdiff_t difference_type; |
|
|
343 | typedef Tp *pointer; |
|
|
344 | typedef const Tp *const_pointer; |
|
|
345 | typedef Tp &reference; |
|
|
346 | typedef const Tp &const_reference; |
|
|
347 | typedef Tp value_type; |
|
|
348 | |
384 | |
349 | template <class U> |
385 | slice_allocator () noexcept { } |
350 | struct rebind |
386 | template<class U> slice_allocator (const slice_allocator<U> &) noexcept {} |
|
|
387 | |
|
|
388 | value_type *allocate (std::size_t n) |
351 | { |
389 | { |
352 | typedef slice_allocator<U> other; |
390 | return salloc<Tp> (n); |
|
|
391 | } |
|
|
392 | |
|
|
393 | void deallocate (value_type *p, std::size_t n) |
|
|
394 | { |
|
|
395 | sfree<Tp> (p, n); |
|
|
396 | } |
|
|
397 | }; |
|
|
398 | |
|
|
399 | template<class T, class U> |
|
|
400 | bool operator == (const slice_allocator<T> &, const slice_allocator<U> &) noexcept |
|
|
401 | { |
|
|
402 | return true; |
|
|
403 | } |
|
|
404 | |
|
|
405 | template<class T, class U> |
|
|
406 | bool operator != (const slice_allocator<T> &x, const slice_allocator<U> &y) noexcept |
|
|
407 | { |
|
|
408 | return !(x == y); |
|
|
409 | } |
|
|
410 | |
|
|
411 | // basically a memory area, but refcounted |
|
|
412 | struct refcnt_buf |
|
|
413 | { |
|
|
414 | char *data; |
|
|
415 | |
|
|
416 | refcnt_buf (size_t size = 0); |
|
|
417 | refcnt_buf (void *data, size_t size); |
|
|
418 | |
|
|
419 | refcnt_buf (const refcnt_buf &src) |
|
|
420 | { |
|
|
421 | data = src.data; |
|
|
422 | inc (); |
|
|
423 | } |
|
|
424 | |
|
|
425 | ~refcnt_buf (); |
|
|
426 | |
|
|
427 | refcnt_buf &operator =(const refcnt_buf &src); |
|
|
428 | |
|
|
429 | operator char *() |
|
|
430 | { |
|
|
431 | return data; |
|
|
432 | } |
|
|
433 | |
|
|
434 | size_t size () const |
|
|
435 | { |
|
|
436 | return _size (); |
|
|
437 | } |
|
|
438 | |
|
|
439 | protected: |
|
|
440 | enum { |
|
|
441 | overhead = sizeof (uint32_t) * 2 |
353 | }; |
442 | }; |
354 | |
443 | |
355 | slice_allocator () throw () { } |
444 | uint32_t &_size () const |
356 | slice_allocator (const slice_allocator &) throw () { } |
|
|
357 | template<typename Tp2> |
|
|
358 | slice_allocator (const slice_allocator<Tp2> &) throw () { } |
|
|
359 | |
|
|
360 | ~slice_allocator () { } |
|
|
361 | |
|
|
362 | pointer address (reference x) const { return &x; } |
|
|
363 | const_pointer address (const_reference x) const { return &x; } |
|
|
364 | |
|
|
365 | pointer allocate (size_type n, const_pointer = 0) |
|
|
366 | { |
445 | { |
367 | return salloc<Tp> (n); |
446 | return ((unsigned int *)data)[-2]; |
368 | } |
447 | } |
369 | |
448 | |
370 | void deallocate (pointer p, size_type n) |
449 | uint32_t &_refcnt () const |
371 | { |
450 | { |
372 | sfree<Tp> (p, n); |
451 | return ((unsigned int *)data)[-1]; |
373 | } |
452 | } |
374 | |
453 | |
375 | size_type max_size () const throw () |
|
|
376 | { |
|
|
377 | return size_t (-1) / sizeof (Tp); |
|
|
378 | } |
|
|
379 | |
|
|
380 | void construct (pointer p, const Tp &val) |
|
|
381 | { |
|
|
382 | ::new (p) Tp (val); |
|
|
383 | } |
|
|
384 | |
|
|
385 | void destroy (pointer p) |
|
|
386 | { |
|
|
387 | p->~Tp (); |
|
|
388 | } |
|
|
389 | }; |
|
|
390 | |
|
|
391 | // P. L'Ecuyer, “Maximally Equidistributed Combined Tausworthe Generators”, Mathematics of Computation, 65, 213 (1996), 203–213. |
|
|
392 | // http://www.iro.umontreal.ca/~lecuyer/myftp/papers/tausme.ps |
|
|
393 | // http://www.iro.umontreal.ca/~lecuyer/myftp/papers/tausme2.ps |
|
|
394 | struct tausworthe_random_generator |
|
|
395 | { |
|
|
396 | uint32_t state [4]; |
|
|
397 | |
|
|
398 | void operator =(const tausworthe_random_generator &src) |
|
|
399 | { |
|
|
400 | state [0] = src.state [0]; |
|
|
401 | state [1] = src.state [1]; |
|
|
402 | state [2] = src.state [2]; |
|
|
403 | state [3] = src.state [3]; |
|
|
404 | } |
|
|
405 | |
|
|
406 | void seed (uint32_t seed); |
|
|
407 | uint32_t next (); |
|
|
408 | }; |
|
|
409 | |
|
|
410 | // Xorshift RNGs, George Marsaglia |
|
|
411 | // http://www.jstatsoft.org/v08/i14/paper |
|
|
412 | // this one is about 40% faster than the tausworthe one above (i.e. not much), |
|
|
413 | // despite the inlining, and has the issue of only creating 2**32-1 numbers. |
|
|
414 | // see also http://www.iro.umontreal.ca/~lecuyer/myftp/papers/xorshift.pdf |
|
|
415 | struct xorshift_random_generator |
|
|
416 | { |
|
|
417 | uint32_t x, y; |
|
|
418 | |
|
|
419 | void operator =(const xorshift_random_generator &src) |
|
|
420 | { |
|
|
421 | x = src.x; |
|
|
422 | y = src.y; |
|
|
423 | } |
|
|
424 | |
|
|
425 | void seed (uint32_t seed) |
454 | void _alloc (uint32_t size) |
426 | { |
455 | { |
427 | x = seed; |
456 | data = ((char *)salloc<char> (size + overhead)) + overhead; |
428 | y = seed * 69069U; |
457 | _size () = size; |
|
|
458 | _refcnt () = 1; |
429 | } |
459 | } |
430 | |
460 | |
431 | uint32_t next () |
461 | void _dealloc (); |
432 | { |
|
|
433 | uint32_t t = x ^ (x << 10); |
|
|
434 | x = y; |
|
|
435 | y = y ^ (y >> 13) ^ t ^ (t >> 10); |
|
|
436 | return y; |
|
|
437 | } |
|
|
438 | }; |
|
|
439 | |
462 | |
440 | template<class generator> |
463 | void inc () |
441 | struct random_number_generator : generator |
|
|
442 | { |
|
|
443 | // uniform distribution, 0 .. max (0, num - 1) |
|
|
444 | uint32_t operator ()(uint32_t num) |
|
|
445 | { |
464 | { |
446 | return !is_constant (num) ? get_range (num) // non-constant |
465 | ++_refcnt (); |
447 | : num & (num - 1) ? (this->next () * (uint64_t)num) >> 32U // constant, non-power-of-two |
|
|
448 | : this->next () & (num - 1); // constant, power-of-two |
|
|
449 | } |
466 | } |
450 | |
467 | |
451 | // return a number within (min .. max) |
468 | void dec () |
452 | int operator () (int r_min, int r_max) |
|
|
453 | { |
469 | { |
454 | return is_constant (r_min) && is_constant (r_max) && r_min <= r_max |
470 | if (!--_refcnt ()) |
455 | ? r_min + operator ()(r_max - r_min + 1) |
471 | _dealloc (); |
456 | : get_range (r_min, r_max); |
|
|
457 | } |
472 | } |
458 | |
|
|
459 | double operator ()() |
|
|
460 | { |
|
|
461 | return this->next () / (double)0xFFFFFFFFU; |
|
|
462 | } |
|
|
463 | |
|
|
464 | protected: |
|
|
465 | uint32_t get_range (uint32_t r_max); |
|
|
466 | int get_range (int r_min, int r_max); |
|
|
467 | }; |
473 | }; |
468 | |
|
|
469 | typedef random_number_generator<tausworthe_random_generator> rand_gen; |
|
|
470 | |
|
|
471 | extern rand_gen rndm, rmg_rndm; |
|
|
472 | |
474 | |
473 | INTERFACE_CLASS (attachable) |
475 | INTERFACE_CLASS (attachable) |
474 | struct refcnt_base |
476 | struct refcnt_base |
475 | { |
477 | { |
476 | typedef int refcnt_t; |
478 | typedef int refcnt_t; |
… | |
… | |
491 | // p if not null |
493 | // p if not null |
492 | refcnt_base::refcnt_t *refcnt_ref () { return p ? &p->refcnt : &refcnt_dummy; } |
494 | refcnt_base::refcnt_t *refcnt_ref () { return p ? &p->refcnt : &refcnt_dummy; } |
493 | |
495 | |
494 | void refcnt_dec () |
496 | void refcnt_dec () |
495 | { |
497 | { |
496 | if (!is_constant (p)) |
498 | if (!ecb_is_constant (p)) |
497 | --*refcnt_ref (); |
499 | --*refcnt_ref (); |
498 | else if (p) |
500 | else if (p) |
499 | --p->refcnt; |
501 | --p->refcnt; |
500 | } |
502 | } |
501 | |
503 | |
502 | void refcnt_inc () |
504 | void refcnt_inc () |
503 | { |
505 | { |
504 | if (!is_constant (p)) |
506 | if (!ecb_is_constant (p)) |
505 | ++*refcnt_ref (); |
507 | ++*refcnt_ref (); |
506 | else if (p) |
508 | else if (p) |
507 | ++p->refcnt; |
509 | ++p->refcnt; |
508 | } |
510 | } |
509 | |
511 | |
… | |
… | |
538 | typedef refptr<maptile> maptile_ptr; |
540 | typedef refptr<maptile> maptile_ptr; |
539 | typedef refptr<object> object_ptr; |
541 | typedef refptr<object> object_ptr; |
540 | typedef refptr<archetype> arch_ptr; |
542 | typedef refptr<archetype> arch_ptr; |
541 | typedef refptr<client> client_ptr; |
543 | typedef refptr<client> client_ptr; |
542 | typedef refptr<player> player_ptr; |
544 | typedef refptr<player> player_ptr; |
|
|
545 | typedef refptr<region> region_ptr; |
|
|
546 | |
|
|
547 | #define STRHSH_NULL 2166136261 |
|
|
548 | |
|
|
549 | static inline uint32_t |
|
|
550 | strhsh (const char *s) |
|
|
551 | { |
|
|
552 | // use FNV-1a hash (http://isthe.com/chongo/tech/comp/fnv/) |
|
|
553 | // it is about twice as fast as the one-at-a-time one, |
|
|
554 | // with good distribution. |
|
|
555 | // FNV-1a is faster on many cpus because the multiplication |
|
|
556 | // runs concurrently with the looping logic. |
|
|
557 | // we modify the hash a bit to improve its distribution |
|
|
558 | uint32_t hash = STRHSH_NULL; |
|
|
559 | |
|
|
560 | while (*s) |
|
|
561 | hash = (hash ^ *s++) * 16777619U; |
|
|
562 | |
|
|
563 | return hash ^ (hash >> 16); |
|
|
564 | } |
|
|
565 | |
|
|
566 | static inline uint32_t |
|
|
567 | memhsh (const char *s, size_t len) |
|
|
568 | { |
|
|
569 | uint32_t hash = STRHSH_NULL; |
|
|
570 | |
|
|
571 | while (len--) |
|
|
572 | hash = (hash ^ *s++) * 16777619U; |
|
|
573 | |
|
|
574 | return hash; |
|
|
575 | } |
543 | |
576 | |
544 | struct str_hash |
577 | struct str_hash |
545 | { |
578 | { |
546 | std::size_t operator ()(const char *s) const |
579 | std::size_t operator ()(const char *s) const |
547 | { |
580 | { |
548 | #if 0 |
|
|
549 | uint32_t hash = 0; |
|
|
550 | |
|
|
551 | /* use the one-at-a-time hash function, which supposedly is |
|
|
552 | * better than the djb2-like one used by perl5.005, but |
|
|
553 | * certainly is better than the bug used here before. |
|
|
554 | * see http://burtleburtle.net/bob/hash/doobs.html |
|
|
555 | */ |
|
|
556 | while (*s) |
|
|
557 | { |
|
|
558 | hash += *s++; |
|
|
559 | hash += hash << 10; |
|
|
560 | hash ^= hash >> 6; |
|
|
561 | } |
|
|
562 | |
|
|
563 | hash += hash << 3; |
|
|
564 | hash ^= hash >> 11; |
|
|
565 | hash += hash << 15; |
|
|
566 | #else |
|
|
567 | // use FNV-1a hash (http://isthe.com/chongo/tech/comp/fnv/) |
|
|
568 | // it is about twice as fast as the one-at-a-time one, |
|
|
569 | // with good distribution. |
|
|
570 | // FNV-1a is faster on many cpus because the multiplication |
|
|
571 | // runs concurrent with the looping logic. |
|
|
572 | uint32_t hash = 2166136261; |
|
|
573 | |
|
|
574 | while (*s) |
|
|
575 | hash = (hash ^ *s++) * 16777619; |
|
|
576 | #endif |
|
|
577 | |
|
|
578 | return hash; |
581 | return strhsh (s); |
579 | } |
582 | } |
|
|
583 | |
|
|
584 | std::size_t operator ()(const shstr &s) const |
|
|
585 | { |
|
|
586 | return strhsh (s); |
|
|
587 | } |
|
|
588 | |
|
|
589 | typedef ska::power_of_two_hash_policy hash_policy; |
580 | }; |
590 | }; |
581 | |
591 | |
582 | struct str_equal |
592 | struct str_equal |
583 | { |
593 | { |
584 | bool operator ()(const char *a, const char *b) const |
594 | bool operator ()(const char *a, const char *b) const |
… | |
… | |
610 | } |
620 | } |
611 | }; |
621 | }; |
612 | |
622 | |
613 | // This container blends advantages of linked lists |
623 | // This container blends advantages of linked lists |
614 | // (efficiency) with vectors (random access) by |
624 | // (efficiency) with vectors (random access) by |
615 | // by using an unordered vector and storing the vector |
625 | // using an unordered vector and storing the vector |
616 | // index inside the object. |
626 | // index inside the object. |
617 | // |
627 | // |
618 | // + memory-efficient on most 64 bit archs |
628 | // + memory-efficient on most 64 bit archs |
619 | // + O(1) insert/remove |
629 | // + O(1) insert/remove |
620 | // + free unique (but varying) id for inserted objects |
630 | // + free unique (but varying) id for inserted objects |
… | |
… | |
657 | insert (&obj); |
667 | insert (&obj); |
658 | } |
668 | } |
659 | |
669 | |
660 | void erase (T *obj) |
670 | void erase (T *obj) |
661 | { |
671 | { |
662 | unsigned int pos = obj->*indexmember; |
672 | object_vector_index pos = obj->*indexmember; |
663 | obj->*indexmember = 0; |
673 | obj->*indexmember = 0; |
664 | |
674 | |
665 | if (pos < this->size ()) |
675 | if (pos < this->size ()) |
666 | { |
676 | { |
667 | (*this)[pos - 1] = (*this)[this->size () - 1]; |
677 | (*this)[pos - 1] = (*this)[this->size () - 1]; |
… | |
… | |
675 | { |
685 | { |
676 | erase (&obj); |
686 | erase (&obj); |
677 | } |
687 | } |
678 | }; |
688 | }; |
679 | |
689 | |
|
|
690 | ///////////////////////////////////////////////////////////////////////////// |
|
|
691 | |
|
|
692 | // something like a vector or stack, but without |
|
|
693 | // out of bounds checking |
|
|
694 | template<typename T> |
|
|
695 | struct fixed_stack |
|
|
696 | { |
|
|
697 | T *data; |
|
|
698 | int size; |
|
|
699 | int max; |
|
|
700 | |
|
|
701 | fixed_stack () |
|
|
702 | : size (0), data (0) |
|
|
703 | { |
|
|
704 | } |
|
|
705 | |
|
|
706 | fixed_stack (int max) |
|
|
707 | : size (0), max (max) |
|
|
708 | { |
|
|
709 | data = salloc<T> (max); |
|
|
710 | } |
|
|
711 | |
|
|
712 | void reset (int new_max) |
|
|
713 | { |
|
|
714 | sfree (data, max); |
|
|
715 | size = 0; |
|
|
716 | max = new_max; |
|
|
717 | data = salloc<T> (max); |
|
|
718 | } |
|
|
719 | |
|
|
720 | void free () |
|
|
721 | { |
|
|
722 | sfree (data, max); |
|
|
723 | data = 0; |
|
|
724 | } |
|
|
725 | |
|
|
726 | ~fixed_stack () |
|
|
727 | { |
|
|
728 | sfree (data, max); |
|
|
729 | } |
|
|
730 | |
|
|
731 | T &operator[](int idx) |
|
|
732 | { |
|
|
733 | return data [idx]; |
|
|
734 | } |
|
|
735 | |
|
|
736 | void push (T v) |
|
|
737 | { |
|
|
738 | data [size++] = v; |
|
|
739 | } |
|
|
740 | |
|
|
741 | T &pop () |
|
|
742 | { |
|
|
743 | return data [--size]; |
|
|
744 | } |
|
|
745 | |
|
|
746 | T remove (int idx) |
|
|
747 | { |
|
|
748 | T v = data [idx]; |
|
|
749 | |
|
|
750 | data [idx] = data [--size]; |
|
|
751 | |
|
|
752 | return v; |
|
|
753 | } |
|
|
754 | }; |
|
|
755 | |
|
|
756 | ///////////////////////////////////////////////////////////////////////////// |
|
|
757 | |
680 | // basically does what strncpy should do, but appends "..." to strings exceeding length |
758 | // basically does what strncpy should do, but appends "..." to strings exceeding length |
681 | // returns the number of bytes actually used (including \0) |
759 | // returns the number of bytes actually used (including \0) |
682 | int assign (char *dst, const char *src, int maxsize); |
760 | int assign (char *dst, const char *src, int maxsize); |
683 | |
761 | |
684 | // type-safe version of assign |
762 | // type-safe version of assign |
… | |
… | |
693 | // return current time as timestamp |
771 | // return current time as timestamp |
694 | tstamp now (); |
772 | tstamp now (); |
695 | |
773 | |
696 | int similar_direction (int a, int b); |
774 | int similar_direction (int a, int b); |
697 | |
775 | |
698 | // like sprintf, but returns a "static" buffer |
776 | // like v?sprintf, but returns a "static" buffer |
699 | const char *format (const char *format, ...); |
777 | char *vformat (const char *format, va_list ap); |
|
|
778 | char *format (const char *format, ...) ecb_attribute ((format (printf, 1, 2))); |
|
|
779 | |
|
|
780 | // safety-check player input which will become object->msg |
|
|
781 | bool msg_is_safe (const char *msg); |
700 | |
782 | |
701 | ///////////////////////////////////////////////////////////////////////////// |
783 | ///////////////////////////////////////////////////////////////////////////// |
702 | // threads, very very thin wrappers around pthreads |
784 | // threads, very very thin wrappers around pthreads |
703 | |
785 | |
704 | struct thread |
786 | struct thread |