[ViewVC] Diff of: cvs/libecb/ecb.h

Comparing libecb/ecb.h (file contents):
Revision 1.192 by root, Mon Jun 21 23:59:58 2021 UTC vs.
Revision 1.200 by root, Fri Aug 20 20:12:33 2021 UTC

 #ifndef ECB_H
 #define ECB_H
 /* 16 bits major, 16 bits minor */
-#define ECB_VERSION 0x00010009
+#define ECB_VERSION 0x0001000a
 #include <string.h> /* for memcpy */
 #if defined (_WIN32) && !defined (__MINGW32__)
   typedef   signed char   int8_t;
 ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count);
 ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count);
 ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count);
 ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count);
-ecb_inline ecb_const uint8_t  ecb_rotl8  (uint8_t  x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); }
+ecb_inline ecb_const uint8_t  ecb_rotl8  (uint8_t  x, unsigned int count) { return (x >> (-count &  7)) | (x << (count &  7)); } /* rotate left by count mod 8; -count & 7 is the complementary right shift, so both shifts stay in 0..7 */
-ecb_inline ecb_const uint8_t  ecb_rotr8  (uint8_t  x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); }
+ecb_inline ecb_const uint8_t  ecb_rotr8  (uint8_t  x, unsigned int count) { return (x << (-count &  7)) | (x >> (count &  7)); } /* rotate right by count mod 8; both shifts stay in 0..7 */
-ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); }
+ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (-count & 15)) | (x << (count & 15)); } /* rotate left by count mod 16; both shifts stay in 0..15 */
-ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); }
+ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (-count & 15)) | (x >> (count & 15)); } /* rotate right by count mod 16; both shifts stay in 0..15 */
-ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); }
+ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (-count & 31)) | (x << (count & 31)); } /* rotate left by count mod 32; both shifts stay in 0..31, so count == 0 no longer shifts by 32 */
-ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); }
+ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (-count & 31)) | (x >> (count & 31)); } /* rotate right by count mod 32; both shifts stay in 0..31 */
-ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); }
+ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (-count & 63)) | (x << (count & 63)); } /* rotate left by count mod 64; both shifts stay in 0..63, so count == 0 no longer shifts by 64 */
-ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); }
+ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (-count & 63)) | (x >> (count & 63)); } /* rotate right by count mod 64; both shifts stay in 0..63 */
 #if ECB_CPP
 inline uint8_t  ecb_ctz (uint8_t  v) { return ecb_ctz32 (v); } /* C++ overload for uint8_t arguments: forwards to ecb_ctz32 */
 inline uint16_t ecb_ctz (uint16_t v) { return ecb_ctz32 (v); } /* C++ overload for uint16_t arguments: forwards to ecb_ctz32 */
 ecb_inline void ecb_poke_u64_u (void *ptr, uint64_t v) { memcpy (ptr, &v, sizeof (v)); } /* copies the bytes of v to ptr with memcpy, i.e. in host byte order; NOTE(review): the _u suffix presumably means ptr may be unaligned - confirm */
 ecb_inline void ecb_poke_be_u16_u (void *ptr, uint_fast16_t v) { ecb_poke_u16_u (ptr, ecb_host_to_be_u16 (v)); } /* converts v with ecb_host_to_be_u16, then stores it via ecb_poke_u16_u */
 ecb_inline void ecb_poke_be_u32_u (void *ptr, uint_fast32_t v) { ecb_poke_u32_u (ptr, ecb_host_to_be_u32 (v)); } /* converts v with ecb_host_to_be_u32, then stores it via ecb_poke_u32_u */
 ecb_inline void ecb_poke_be_u64_u (void *ptr, uint_fast64_t v) { ecb_poke_u64_u (ptr, ecb_host_to_be_u64 (v)); } /* converts v with ecb_host_to_be_u64, then stores it via ecb_poke_u64_u */
 ecb_inline void ecb_poke_le_u16_u (void *ptr, uint_fast16_t v) { ecb_poke_u16_u (ptr, ecb_host_to_le_u16 (v)); } /* converts v with ecb_host_to_le_u16, then stores it via ecb_poke_u16_u */
 ecb_inline void ecb_poke_le_u32_u (void *ptr, uint_fast32_t v) { ecb_poke_u32_u (ptr, ecb_host_to_le_u32 (v)); } /* converts v with ecb_host_to_le_u32, then stores it via ecb_poke_u32_u */
 ecb_inline void ecb_poke_le_u64_u (void *ptr, uint_fast64_t v) { ecb_poke_u64_u (ptr, ecb_host_to_le_u64 (v)); } /* converts v with ecb_host_to_le_u64, then stores it via ecb_poke_u64_u */
 #if ECB_CPP
 template<typename T> inline void ecb_poke_be   (void *ptr, T v) { return ecb_poke  <T> (ptr, ecb_host_to_be (v)); } /* converts v with ecb_host_to_be, then stores it via ecb_poke<T> */
 template<typename T> inline void ecb_poke_le   (void *ptr, T v) { return ecb_poke  <T> (ptr, ecb_host_to_le (v)); } /* converts v with ecb_host_to_le, then stores it via ecb_poke<T> */
 template<typename T> inline void ecb_poke_u    (void *ptr, T v) { memcpy (ptr, &v, sizeof (v)); } /* copies the sizeof (T) bytes of v to ptr with memcpy, in host byte order */
 template<typename T> inline void ecb_poke_be_u (void *ptr, T v) { return ecb_poke_u<T> (ptr, ecb_host_to_be (v)); } /* converts v with ecb_host_to_be, then stores it via ecb_poke_u<T> */
 template<typename T> inline void ecb_poke_le_u (void *ptr, T v) { return ecb_poke_u<T> (ptr, ecb_host_to_le (v)); } /* converts v with ecb_host_to_le, then stores it via ecb_poke_u<T> */
+#endif
+/*****************************************************************************/
+/* pointer/integer hashing */
+/* based on hash by Chris Wellons, https://nullprogram.com/blog/2018/07/31/ */
+ecb_function_ uint32_t ecb_mix32 (uint32_t v); /* prototype, immediately followed by the definition */
+ecb_function_ uint32_t ecb_mix32 (uint32_t v) /* returns v with its bits mixed: two xorshift-multiply rounds plus a final xorshift */
+{
+  v ^= v >> 16; v *= 0x7feb352dU; /* fold the upper 16 bits into the lower ones, then multiply by an odd constant (wraps modulo 2**32) */
+  v ^= v >> 15; v *= 0x846ca68bU; /* second round with a different shift and odd multiplier */
+  v ^= v >> 16; /* final xorshift so the high bits affect the low bits once more */
+  return v;
+}
+ecb_function_ uint32_t ecb_unmix32 (uint32_t v); /* prototype, immediately followed by the definition */
+ecb_function_ uint32_t ecb_unmix32 (uint32_t v) /* walks the steps of ecb_mix32 in reverse order, undoing each one */
+{
+  v ^= v >> 16          ; v *= 0x43021123U; /* a 16-bit xorshift on 32 bits is its own inverse; NOTE(review): constant is presumably the inverse of 0x846ca68b modulo 2**32 - verify */
+  v ^= v >> 15 ^ v >> 30; v *= 0x1d69e2a5U; /* undoing a 15-bit xorshift needs the extra v >> 30 term; NOTE(review): constant is presumably the inverse of 0x7feb352d modulo 2**32 - verify */
+  v ^= v >> 16          ; /* undoes the first xorshift of ecb_mix32 */
+  return v;
+}
+/* based on splitmix64, by Sebastiano Vigna, https://prng.di.unimi.it/splitmix64.c */
+ecb_function_ uint64_t ecb_mix64 (uint64_t v); /* prototype, immediately followed by the definition */
+ecb_function_ uint64_t ecb_mix64 (uint64_t v) /* returns v with its bits mixed: two xorshift-multiply rounds plus a final xorshift */
+{
+  v ^= v >> 30; v *= 0xbf58476d1ce4e5b9U; /* xorshift by 30, then multiply by an odd constant (wraps modulo 2**64) */
+  v ^= v >> 27; v *= 0x94d049bb133111ebU; /* second round with a different shift and odd multiplier */
+  v ^= v >> 31; /* final xorshift */
+  return v;
+}
+ecb_function_ uint64_t ecb_unmix64 (uint64_t v); /* prototype, immediately followed by the definition */
+ecb_function_ uint64_t ecb_unmix64 (uint64_t v) /* walks the steps of ecb_mix64 in reverse order, undoing each one */
+{
+  v ^= v >> 31 ^ v >> 62; v *= 0x319642b2d24d8ec3U; /* undoes the final 31-bit xorshift; NOTE(review): constant is presumably the inverse of 0x94d049bb133111eb modulo 2**64 - verify */
+  v ^= v >> 27 ^ v >> 54; v *= 0x96de1b173f119089U; /* undoes the 27-bit xorshift; NOTE(review): constant is presumably the inverse of 0xbf58476d1ce4e5b9 modulo 2**64 - verify */
+  v ^= v >> 30 ^ v >> 60; /* undoes the first 30-bit xorshift of ecb_mix64 */
+  return v;
+}
+ecb_function_ uintptr_t ecb_ptrmix (void *p); /* prototype, immediately followed by the definition */
+ecb_function_ uintptr_t ecb_ptrmix (void *p) /* hashes a pointer value: casts p to an integer and mixes it, with the width chosen by ECB_PTRSIZE */
+{
+  #if ECB_PTRSIZE <= 4
+  return ecb_mix32 ((uint32_t)p); /* pointers of at most 4 bytes go through the 32-bit mixer */
+  #else
+  return ecb_mix64 ((uint64_t)p); /* larger pointers go through the 64-bit mixer */
+  #endif
+}
+ecb_function_ void *ecb_ptrunmix (uintptr_t v); /* prototype, immediately followed by the definition */
+ecb_function_ void *ecb_ptrunmix (uintptr_t v) /* runs v through ecb_unmix32/ecb_unmix64 (chosen by ECB_PTRSIZE) and casts the result to a pointer; presumably recovers the pointer given to ecb_ptrmix */
+{
+  #if ECB_PTRSIZE <= 4
+  return (void *)ecb_unmix32 (v); /* same width selection as ecb_ptrmix */
+  #else
+  return (void *)ecb_unmix64 (v);
+  #endif
+}
+#if ECB_CPP
+template<typename T>
+inline uintptr_t ecb_ptrmix (T *p) /* C++ convenience overload for typed pointers */
+{
+  return ecb_ptrmix (static_cast<void *>(p)); /* converts to void * and calls ecb_ptrmix again with that argument */
+}
+template<typename T>
+inline T *ecb_ptrunmix (uintptr_t v) /* C++ typed variant; T appears only in the return type, so callers must name it explicitly, e.g. ecb_ptrunmix<foo> (v) */
+{
+  return static_cast<T *>(ecb_ptrunmix (v)); /* unmixes via the void * version, then casts to T * */
+}
 #endif
 /*****************************************************************************/
 /* division */
 }
 /*******************************************************************************/
 /* fast integer to ascii */
+/*
+ * This code is pretty complicated because it is general. The idea behind it,
+ * however, is pretty simple: first, the number is multiplied with a scaling
+ * factor (2**bits / 10**(digits-1)) to convert the integer into a fixed-point
+ * number with the first digit in the upper bits.
+ * Then this digit is converted to text and masked out. The resulting number
+ * is then multiplied by 10, by multiplying the fixed point representation
+ * by 5 and shifting the (binary) decimal point one to the right, so a 4.28
+ * format becomes 5.27, 6.26 and so on.
+ * The rest involves only advancing the pointer if we already generated a
+ * non-zero digit, so leading zeroes are overwritten.
+ */
-// simply return a mask with "bits" bits set
+/* simply return a mask with "bits" bits set */
 #define ecb_i2a_mask(type,bits) ((((type)1) << (bits)) - 1)
-// oputput a single digit. maskvalue is 10**digitidx
+/* output a single digit. maskvalue is 10**digitidx */
 #define ecb_i2a_digit(type,bits,digitmask,maskvalue,digitidx) /* not self-contained: reads and updates ptr, x and nz from the expanding scope */ \
   if (digitmask >= maskvalue) /* constant, used to decide how many digits to generate */ \
     { \
       char digit = x >> (bits - digitidx); /* calculate the topmost digit */ \
       *ptr = digit + '0'; /* output it */ \
       nz = (digitmask == maskvalue) || nz || digit; /* first term == always output last digit */ \
       ptr += nz; /* output digit only if non-zero digit seen */ \
       x = (x & ecb_i2a_mask (type, bits - digitidx)) * 5; /* *10, but shift decimal point right */ \
     }
-// convert integer to fixed point format and multiply out digits, highest first
+/* convert integer to fixed point format and multiply out digits, highest first */
-// requires magic constants: max. digits and number of bits after the decimal point
+/* requires magic constants: max. digits and number of bits after the decimal point */
 #define ecb_i2a_def(suffix,ptr,v,type,bits,digitmask,lz) \
 ecb_inline char *ecb_i2a_ ## suffix (char *ptr, uint32_t u) \
 { \
   char nz = lz; /* non-zero digit seen? */ \
   /* convert to x.bits fixed-point */ \
   ecb_i2a_digit (type,bits,digitmask,  100000000, 8); \
   ecb_i2a_digit (type,bits,digitmask, 1000000000, 9); \
   return ptr; \
 }
-// predefined versions of the above, for various digits
+/* predefined versions of the above, for various digits */
-// ecb_i2a_xN = almost N digits, limit defined by macro
+/* ecb_i2a_xN = almost N digits, limit defined by macro */
-// ecb_i2a_N = up to N digits, leading zeroes suppressed
+/* ecb_i2a_N = up to N digits, leading zeroes suppressed */
-// ecb_i2a_0N = exactly N digits, including leading zeroes
+/* ecb_i2a_0N = exactly N digits, including leading zeroes */
-// non-leading-zero versions, limited range
+/* non-leading-zero versions, limited range */
-#define ECB_I2A_MAX_X5       59074 // limit for ecb_i2a_x5
+#define ECB_I2A_MAX_X5       59074 /* limit for ecb_i2a_x5 */
-#define ECB_I2A_MAX_X10 2932500665 // limit for ecb_i2a_x10
+#define ECB_I2A_MAX_X10 2932500665 /* limit for ecb_i2a_x10 */
 ecb_i2a_def ( x5, ptr, v, uint32_t, 26,      10000, 0)
 ecb_i2a_def (x10, ptr, v, uint64_t, 60, 1000000000, 0)
-// non-leading zero versions, all digits, 4 and 9 are optimal for 32/64 bit
+/* non-leading zero versions, all digits, 4 and 9 are optimal for 32/64 bit */
-ecb_i2a_def ( 2, ptr, v, uint32_t, 10,         10, 0)
+ecb_i2a_def ( 2, ptr, v, uint32_t, 10,          10, 0)
-ecb_i2a_def ( 3, ptr, v, uint32_t, 12,        100, 0)
+ecb_i2a_def ( 3, ptr, v, uint32_t, 12,         100, 0)
-ecb_i2a_def ( 4, ptr, v, uint32_t, 26,       1000, 0)
+ecb_i2a_def ( 4, ptr, v, uint32_t, 26,        1000, 0)
-ecb_i2a_def ( 5, ptr, v, uint64_t, 30,      10000, 0)
+ecb_i2a_def ( 5, ptr, v, uint64_t, 30,       10000, 0)
-ecb_i2a_def ( 6, ptr, v, uint64_t, 36,     100000, 0)
+ecb_i2a_def ( 6, ptr, v, uint64_t, 36,      100000, 0)
-ecb_i2a_def ( 7, ptr, v, uint64_t, 44,    1000000, 0)
+ecb_i2a_def ( 7, ptr, v, uint64_t, 44,     1000000, 0)
-ecb_i2a_def ( 8, ptr, v, uint64_t, 50,   10000000, 0)
+ecb_i2a_def ( 8, ptr, v, uint64_t, 50,    10000000, 0)
-ecb_i2a_def ( 9, ptr, v, uint64_t, 56,  100000000, 0)
+ecb_i2a_def ( 9, ptr, v, uint64_t, 56,   100000000, 0)
-// leading-zero versions, all digits, 04 and 09 are optimal for 32/64 bit
+/* leading-zero versions, all digits, 04 and 09 are optimal for 32/64 bit */
-ecb_i2a_def (02, ptr, v, uint32_t, 10,         10, 1)
+ecb_i2a_def (02, ptr, v, uint32_t, 10,          10, 1)
-ecb_i2a_def (03, ptr, v, uint32_t, 12,        100, 1)
+ecb_i2a_def (03, ptr, v, uint32_t, 12,         100, 1)
-ecb_i2a_def (04, ptr, v, uint32_t, 26,       1000, 1)
+ecb_i2a_def (04, ptr, v, uint32_t, 26,        1000, 1)
-ecb_i2a_def (05, ptr, v, uint64_t, 30,      10000, 1)
+ecb_i2a_def (05, ptr, v, uint64_t, 30,       10000, 1)
-ecb_i2a_def (06, ptr, v, uint64_t, 36,     100000, 1)
+ecb_i2a_def (06, ptr, v, uint64_t, 36,      100000, 1)
-ecb_i2a_def (07, ptr, v, uint64_t, 44,    1000000, 1)
+ecb_i2a_def (07, ptr, v, uint64_t, 44,     1000000, 1)
-ecb_i2a_def (08, ptr, v, uint64_t, 50,   10000000, 1)
+ecb_i2a_def (08, ptr, v, uint64_t, 50,    10000000, 1)
-ecb_i2a_def (09, ptr, v, uint64_t, 56,  100000000, 1)
+ecb_i2a_def (09, ptr, v, uint64_t, 56,   100000000, 1)
 #define ECB_I2A_I32_DIGITS 11
 #define ECB_I2A_U32_DIGITS 10
 #define ECB_I2A_I64_DIGITS 20
-#define ECB_I2A_U32_DIGITS 21
+#define ECB_I2A_U64_DIGITS 21
-#define ECB_I2A_DIGITS     21
+#define ECB_I2A_MAX_DIGITS 21
 ecb_inline char *
 ecb_i2a_u32 (char *ptr, uint32_t u)
 {
   #if ECB_64BIT_NATIVE
     if (ecb_expect_true (u <= ECB_I2A_MAX_X10))
       ptr = ecb_i2a_x10 (ptr, u);
-    else // x10 almost, but not fully, covers 32 bit
+    else /* x10 almost, but not fully, covers 32 bit */
       {
         uint32_t u1 = u % 1000000000;
         uint32_t u2 = u / 1000000000;
         *ptr++ = u2 + '0';
 {
   *ptr = '-'; ptr += v < 0;
   uint32_t u = v < 0 ? -(uint32_t)v : v;
   #if ECB_64BIT_NATIVE
-    ptr = ecb_i2a_x10 (ptr, u); // x10 fully covers 31 bit
+    ptr = ecb_i2a_x10 (ptr, u); /* x10 fully covers 31 bit */
   #else
     ptr = ecb_i2a_u32 (ptr, u);
   #endif
   return ptr;
         uint64_t u1 = u  % 1000000000;
         uint64_t ua = u  / 1000000000;
         uint64_t u2 = ua % 1000000000;
         uint64_t u3 = ua / 1000000000;
-        // 2**31 is 19 digits, so the top is exactly one digit
+        /* 2**63 is 19 digits, so the top is exactly one digit */
         *ptr++ = u3 + '0';
         ptr = ecb_i2a_09 (ptr, u2);
         ptr = ecb_i2a_09 (ptr, u1);
       }
   #else

Diff Legend

-–
+Removed lines
-+
+Added lines
-<
+Changed lines
->
+Changed lines

Comparing libecb/ecb.h (file contents): Revision 1.192 by root, Mon Jun 21 23:59:58 2021 UTC vs. Revision 1.200 by root, Fri Aug 20 20:12:33 2021 UTC

Diff Legend

Comparing libecb/ecb.h (file contents):
Revision 1.192 by root, Mon Jun 21 23:59:58 2021 UTC vs.
Revision 1.200 by root, Fri Aug 20 20:12:33 2021 UTC