[ViewVC] Diff of: cvs/deliantra/server/include/util.h

Comparing deliantra/server/include/util.h (file contents):
Revision 1.78 by root, Thu Dec 4 03:48:19 2008 UTC vs.
Revision 1.85 by root, Thu Jan 1 20:49:48 2009 UTC

 #if __GNUC__ >= 3
 # define is_constant(c)             __builtin_constant_p (c)
 # define expect(expr,value)         __builtin_expect ((expr),(value))
 # define prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
+# define noinline                   __attribute__((__noinline__))
 #else
 # define is_constant(c)             0
 # define expect(expr,value)         (expr)
 # define prefetch(addr,rw,locality)
+# define noinline
 #endif
 // emulate decltype with the GNU typeof extension on GCC releases older than 4.4.
 // the minor version must only be consulted within the 4.x series, hence "&&":
 // with "||" the test was also true for every 4.x release (4.4 and newer included)
 // and for any later major release whose minor number happens to be below 4.
 // __typeof__ is the spelling that remains available in strict ISO modes.
 #if __GNUC__ < 4 || (__GNUC__ == 4 && __GNUC_MINOR__ < 4)
 # define decltype(x) __typeof__(x)
 #endif
 // put into ifs if you are very sure that the expression
 // is mostly true or mostly false. note that these return
 // booleans, not the expression.
-#define expect_false(expr) expect ((expr) != 0, 0)
+#define expect_false(expr) expect ((expr) ? 1 : 0, 0)
-#define expect_true(expr)  expect ((expr) != 0, 1)
+#define expect_true(expr)  expect ((expr) ? 1 : 0, 1)
 #include <pthread.h>
 #include <cstddef>
 #include <cmath>
 #endif
 // use C0X decltype for auto declarations until ISO C++ sanctifies them (if ever)
 #define auto(var,expr) decltype(expr) var = (expr)
-// very ugly macro that basicaly declares and initialises a variable
+// very ugly macro that basically declares and initialises a variable
 // that is in scope for the next statement only
 // works only for stuff that can be assigned 0 and converts to false
 // (note: works great for pointers)
 // most ugly macro I ever wrote
 #define statementvar(type, name, value) if (type name = 0) { } else if (((name) = (value)), 1)
 // as a is often a constant while b is the variable. it is still a bug, though.
 template<typename T, typename U> static inline T min (T a, U b) { return (U)a < b ? (U)a : b; }
 template<typename T, typename U> static inline T max (T a, U b) { return (U)a > b ? (U)a : b; }
 template<typename T, typename U, typename V> static inline T clamp (T v, U a, V b) { return v < (T)a ? (T)a : v >(T)b ? (T)b : v; }
-template<typename T> static inline void min_it (T &v, T m) { v = min (v, m); }
+template<typename T, typename U> static inline void min_it (T &v, U m) { v = min (v, (T)m); }
-template<typename T> static inline void max_it (T &v, T m) { v = max (v, m); }
+template<typename T, typename U> static inline void max_it (T &v, U m) { v = max (v, (T)m); }
-template<typename T> static inline void clamp_it (T &v, T a, T b) { v = clamp (v, a, b); }
+template<typename T, typename U, typename V> static inline void clamp_it (T &v, U a, V b) { v = clamp (v, (T)a, (T)b); }
 template<typename T, typename U> static inline void swap (T& a, U& b) { T t=a; a=(T)b; b=(U)t; }
 template<typename T, typename U, typename V> static inline T min (T a, U b, V c) { return min (a, min (b, c)); }
 template<typename T, typename U, typename V> static inline T max (T a, U b, V c) { return max (a, max (b, c)); }
+// sign returns -1 or +1
+template<typename T>
+static inline T sign (T v) { return v < 0 ? -1 : +1; }
+// relies on two's complement representation
+template<>
+inline sint8 sign (sint8 v) { return 1 - (sint8 (uint8 (v) >> 7) * 2); }
+// sign0 returns -1, 0 or +1
+template<typename T>
+static inline T sign0 (T v) { return v ? sign (v) : 0; }
 // div, with correct rounding (< 0.5 downwards, >=0.5 upwards)
 template<typename T> static inline T div    (T val, T div) { return (val + div / 2) / div; }
 // div, round-up
 template<typename T> static inline T div_ru (T val, T div) { return (val + div - 1) / div; }
 // P. L'Ecuyer, “Maximally Equidistributed Combined Tausworthe Generators”, Mathematics of Computation, 65, 213 (1996), 203–213.
 // http://www.iro.umontreal.ca/~lecuyer/myftp/papers/tausme.ps
 // http://www.iro.umontreal.ca/~lecuyer/myftp/papers/tausme2.ps
 struct tausworthe_random_generator
 {
-  // generator
   uint32_t state [4];
   void operator =(const tausworthe_random_generator &src)
   {
     state [0] = src.state [0];
     state [3] = src.state [3];
   }
   void seed (uint32_t seed);
   uint32_t next ();
+};
+// Xorshift RNGs, George Marsaglia
+// http://www.jstatsoft.org/v08/i14/paper
+// this one is about 40% faster than the tausworthe one above (i.e. not much),
+// despite the inlining, and has the issue of only creating 2**32-1 numbers.
+struct xorshift_random_generator
+{
+  uint32_t x, y;
+  void operator =(const xorshift_random_generator &src)
+  {
+    x = src.x;
+    y = src.y;
+  }
+  void seed (uint32_t seed)
+  {
+    x = seed;
+    y = seed * 69069U;
+  }
+  uint32_t next ()
+  {
+    uint32_t t = x ^ (x << 10);
+    x = y;
+    y = y ^ (y >> 13) ^ t ^ (t >> 10);
+    return y;
+  }
+};
+template<class generator>
+struct random_number_generator : generator
+{
   // uniform distribution, 0 .. max (0, num - 1)
   uint32_t operator ()(uint32_t num)
   {
-    return is_constant (num)
+    return !is_constant (num) ? get_range (num)                        // non-constant
-             ? (next () * (uint64_t)num) >> 32U
+         : num & (num - 1)    ? (this->next () * (uint64_t)num) >> 32U // constant, non-power-of-two
-             : get_range (num);
+         :                      this->next () & (num - 1);             // constant, power-of-two
   }
   // return a number within (min .. max)
   int operator () (int r_min, int r_max)
   {
 protected:
   uint32_t get_range (uint32_t r_max);
   int get_range (int r_min, int r_max);
 };
-typedef tausworthe_random_generator rand_gen;
+typedef random_number_generator<tausworthe_random_generator> rand_gen;
 extern rand_gen rndm, rmg_rndm;
 INTERFACE_CLASS (attachable)
 struct refcnt_base
 struct str_hash
 {
   std::size_t operator ()(const char *s) const
   {
-    unsigned long hash = 0;
+#if 0
+    uint32_t hash = 0;
     /* use the one-at-a-time hash function, which supposedly is
      * better than the djb2-like one used by perl5.005, but
      * certainly is better than the bug used here before.
      * see http://burtleburtle.net/bob/hash/doobs.html
       }
     hash += hash <<  3;
     hash ^= hash >> 11;
     hash += hash << 15;
+#else
+    // use FNV-1a hash (http://isthe.com/chongo/tech/comp/fnv/)
+    // it is about twice as fast as the one-at-a-time one,
+    // with good distribution.
+    // FNV-1a is faster on many cpus because the multiplication
+    // runs concurrent with the looping logic.
+    uint32_t hash = 2166136261;
+    while (*s)
+      hash = (hash ^ *s++) * 16777619;
+#endif
     return hash;
   }
 };

Diff Legend

-–
+Removed lines
-+
+Added lines
-<
+Changed lines
->
+Changed lines

Comparing deliantra/server/include/util.h (file contents): Revision 1.78 by root, Thu Dec 4 03:48:19 2008 UTC vs. Revision 1.85 by root, Thu Jan 1 20:49:48 2009 UTC

Diff Legend

Comparing deliantra/server/include/util.h (file contents):
Revision 1.78 by root, Thu Dec 4 03:48:19 2008 UTC vs.
Revision 1.85 by root, Thu Jan 1 20:49:48 2009 UTC