ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/libev/ev.c
(Generate patch)

Comparing libev/ev.c (file contents):
Revision 1.464 by root, Fri Mar 21 16:41:04 2014 UTC vs.
Revision 1.479 by root, Sun Dec 20 01:31:17 2015 UTC

43# include EV_CONFIG_H 43# include EV_CONFIG_H
44# else 44# else
45# include "config.h" 45# include "config.h"
46# endif 46# endif
47 47
48#if HAVE_FLOOR 48# if HAVE_FLOOR
49# ifndef EV_USE_FLOOR 49# ifndef EV_USE_FLOOR
50# define EV_USE_FLOOR 1 50# define EV_USE_FLOOR 1
51# endif
51# endif 52# endif
52#endif
53 53
54# if HAVE_CLOCK_SYSCALL 54# if HAVE_CLOCK_SYSCALL
55# ifndef EV_USE_CLOCK_SYSCALL 55# ifndef EV_USE_CLOCK_SYSCALL
56# define EV_USE_CLOCK_SYSCALL 1 56# define EV_USE_CLOCK_SYSCALL 1
57# ifndef EV_USE_REALTIME 57# ifndef EV_USE_REALTIME
256# else 256# else
257# define EV_USE_CLOCK_SYSCALL 0 257# define EV_USE_CLOCK_SYSCALL 0
258# endif 258# endif
259#endif 259#endif
260 260
261#if !(_POSIX_TIMERS > 0)
262# ifndef EV_USE_MONOTONIC
263# define EV_USE_MONOTONIC 0
264# endif
265# ifndef EV_USE_REALTIME
266# define EV_USE_REALTIME 0
267# endif
268#endif
269
261#ifndef EV_USE_MONOTONIC 270#ifndef EV_USE_MONOTONIC
262# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0 271# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0
263# define EV_USE_MONOTONIC EV_FEATURE_OS 272# define EV_USE_MONOTONIC EV_FEATURE_OS
264# else 273# else
265# define EV_USE_MONOTONIC 0 274# define EV_USE_MONOTONIC 0
482/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */ 491/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */
483/* ECB.H BEGIN */ 492/* ECB.H BEGIN */
484/* 493/*
485 * libecb - http://software.schmorp.de/pkg/libecb 494 * libecb - http://software.schmorp.de/pkg/libecb
486 * 495 *
487 * Copyright (©) 2009-2014 Marc Alexander Lehmann <libecb@schmorp.de> 496 * Copyright (©) 2009-2015 Marc Alexander Lehmann <libecb@schmorp.de>
488 * Copyright (©) 2011 Emanuele Giaquinta 497 * Copyright (©) 2011 Emanuele Giaquinta
489 * All rights reserved. 498 * All rights reserved.
490 * 499 *
491 * Redistribution and use in source and binary forms, with or without modifica- 500 * Redistribution and use in source and binary forms, with or without modifica-
492 * tion, are permitted provided that the following conditions are met: 501 * tion, are permitted provided that the following conditions are met:
506 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; 515 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
507 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, 516 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
508 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH- 517 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH-
509 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED 518 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
510 * OF THE POSSIBILITY OF SUCH DAMAGE. 519 * OF THE POSSIBILITY OF SUCH DAMAGE.
520 *
521 * Alternatively, the contents of this file may be used under the terms of
522 * the GNU General Public License ("GPL") version 2 or any later version,
523 * in which case the provisions of the GPL are applicable instead of
524 * the above. If you wish to allow the use of your version of this file
525 * only under the terms of the GPL and not to allow others to use your
526 * version of this file under the BSD license, indicate your decision
527 * by deleting the provisions above and replace them with the notice
528 * and other provisions required by the GPL. If you do not delete the
529 * provisions above, a recipient may use your version of this file under
530 * either the BSD or the GPL.
511 */ 531 */
512 532
513#ifndef ECB_H 533#ifndef ECB_H
514#define ECB_H 534#define ECB_H
515 535
516/* 16 bits major, 16 bits minor */ 536/* 16 bits major, 16 bits minor */
517#define ECB_VERSION 0x00010003 537#define ECB_VERSION 0x00010005
518 538
519#ifdef _WIN32 539#ifdef _WIN32
520 typedef signed char int8_t; 540 typedef signed char int8_t;
521 typedef unsigned char uint8_t; 541 typedef unsigned char uint8_t;
522 typedef signed short int16_t; 542 typedef signed short int16_t;
539 typedef uint32_t uintptr_t; 559 typedef uint32_t uintptr_t;
540 typedef int32_t intptr_t; 560 typedef int32_t intptr_t;
541 #endif 561 #endif
542#else 562#else
543 #include <inttypes.h> 563 #include <inttypes.h>
544 #if UINTMAX_MAX > 0xffffffffU 564 #if (defined INTPTR_MAX ? INTPTR_MAX : ULONG_MAX) > 0xffffffffU
545 #define ECB_PTRSIZE 8 565 #define ECB_PTRSIZE 8
546 #else 566 #else
547 #define ECB_PTRSIZE 4 567 #define ECB_PTRSIZE 4
548 #endif 568 #endif
549#endif 569#endif
550 570
571#define ECB_GCC_AMD64 (__amd64 || __amd64__ || __x86_64 || __x86_64__)
572#define ECB_MSVC_AMD64 (_M_AMD64 || _M_X64)
573
551/* work around x32 idiocy by defining proper macros */ 574/* work around x32 idiocy by defining proper macros */
552#if __amd64 || __x86_64 || _M_AMD64 || _M_X64 575#if ECB_GCC_AMD64 || ECB_MSVC_AMD64
553 #if _ILP32 576 #if _ILP32
554 #define ECB_AMD64_X32 1 577 #define ECB_AMD64_X32 1
555 #else 578 #else
556 #define ECB_AMD64 1 579 #define ECB_AMD64 1
557 #endif 580 #endif
562 * causing enormous grief in return for some better fake benchmark numbers. 585 * causing enormous grief in return for some better fake benchmark numbers.
563 * or so. 586 * or so.
564 * we try to detect these and simply assume they are not gcc - if they have 587 * we try to detect these and simply assume they are not gcc - if they have
565 * an issue with that they should have done it right in the first place. 588 * an issue with that they should have done it right in the first place.
566 */ 589 */
567#ifndef ECB_GCC_VERSION
568 #if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__ 590#if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__
569 #define ECB_GCC_VERSION(major,minor) 0 591 #define ECB_GCC_VERSION(major,minor) 0
570 #else 592#else
571 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor))) 593 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor)))
572 #endif 594#endif
595
596#define ECB_CLANG_VERSION(major,minor) (__clang_major__ > (major) || (__clang_major__ == (major) && __clang_minor__ >= (minor)))
597
598#if __clang__ && defined __has_builtin
599 #define ECB_CLANG_BUILTIN(x) __has_builtin (x)
600#else
601 #define ECB_CLANG_BUILTIN(x) 0
602#endif
603
604#if __clang__ && defined __has_extension
605 #define ECB_CLANG_EXTENSION(x) __has_extension (x)
606#else
607 #define ECB_CLANG_EXTENSION(x) 0
573#endif 608#endif
574 609
575#define ECB_CPP (__cplusplus+0) 610#define ECB_CPP (__cplusplus+0)
576#define ECB_CPP11 (__cplusplus >= 201103L) 611#define ECB_CPP11 (__cplusplus >= 201103L)
577 612
605 #define ECB_NO_SMP 1 640 #define ECB_NO_SMP 1
606#endif 641#endif
607 642
608#if ECB_NO_SMP 643#if ECB_NO_SMP
609 #define ECB_MEMORY_FENCE do { } while (0) 644 #define ECB_MEMORY_FENCE do { } while (0)
645#endif
646
647/* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/compiler_ref/compiler_builtins.html */
648#if __xlC__ && ECB_CPP
649 #include <builtins.h>
650#endif
651
652#if 1400 <= _MSC_VER
653 #include <intrin.h> /* fence functions _ReadBarrier, also bit search functions _BitScanReverse */
610#endif 654#endif
611 655
612#ifndef ECB_MEMORY_FENCE 656#ifndef ECB_MEMORY_FENCE
613 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110 657 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110
614 #if __i386 || __i386__ 658 #if __i386 || __i386__
615 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory") 659 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory")
616 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 660 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
617 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 661 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
618 #elif __amd64 || __amd64__ || __x86_64 || __x86_64__ 662 #elif ECB_GCC_AMD64
619 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory") 663 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory")
620 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 664 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
621 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 665 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
622 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ 666 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__
623 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory") 667 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory")
668 #elif defined __ARM_ARCH_2__ \
669 || defined __ARM_ARCH_3__ || defined __ARM_ARCH_3M__ \
670 || defined __ARM_ARCH_4__ || defined __ARM_ARCH_4T__ \
671 || defined __ARM_ARCH_5__ || defined __ARM_ARCH_5E__ \
672 || defined __ARM_ARCH_5T__ || defined __ARM_ARCH_5TE__ \
673 || defined __ARM_ARCH_5TEJ__
674 /* should not need any, unless running old code on newer cpu - arm doesn't support that */
624 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \ 675 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \
625 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ 676 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ \
677 || defined __ARM_ARCH_6T2__
626 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory") 678 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory")
627 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \ 679 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \
628 || defined __ARM_ARCH_7M__ || defined __ARM_ARCH_7R__ 680 || defined __ARM_ARCH_7R__ || defined __ARM_ARCH_7M__
629 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory") 681 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory")
630 #elif __aarch64__ 682 #elif __aarch64__
631 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb ish" : : : "memory") 683 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb ish" : : : "memory")
632 #elif (__sparc || __sparc__) && !__sparcv8 684 #elif (__sparc || __sparc__) && !(__sparc_v8__ || defined __sparcv8)
633 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory") 685 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory")
634 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory") 686 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory")
635 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore") 687 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore")
636 #elif defined __s390__ || defined __s390x__ 688 #elif defined __s390__ || defined __s390x__
637 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory") 689 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory")
661 /* see comment below (stdatomic.h) about the C11 memory model. */ 713 /* see comment below (stdatomic.h) about the C11 memory model. */
662 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST) 714 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST)
663 #define ECB_MEMORY_FENCE_ACQUIRE __atomic_thread_fence (__ATOMIC_ACQUIRE) 715 #define ECB_MEMORY_FENCE_ACQUIRE __atomic_thread_fence (__ATOMIC_ACQUIRE)
664 #define ECB_MEMORY_FENCE_RELEASE __atomic_thread_fence (__ATOMIC_RELEASE) 716 #define ECB_MEMORY_FENCE_RELEASE __atomic_thread_fence (__ATOMIC_RELEASE)
665 717
666 /* The __has_feature syntax from clang is so misdesigned that we cannot use it 718 #elif ECB_CLANG_EXTENSION(c_atomic)
667 * without risking compile time errors with other compilers. We *could*
668 * define our own ecb_clang_has_feature, but I just can't be bothered to work
669 * around this shit time and again.
670 * #elif defined __clang && __has_feature (cxx_atomic)
671 * // see comment below (stdatomic.h) about the C11 memory model. 719 /* see comment below (stdatomic.h) about the C11 memory model. */
672 * #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST) 720 #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST)
673 * #define ECB_MEMORY_FENCE_ACQUIRE __c11_atomic_thread_fence (__ATOMIC_ACQUIRE) 721 #define ECB_MEMORY_FENCE_ACQUIRE __c11_atomic_thread_fence (__ATOMIC_ACQUIRE)
674 * #define ECB_MEMORY_FENCE_RELEASE __c11_atomic_thread_fence (__ATOMIC_RELEASE) 722 #define ECB_MEMORY_FENCE_RELEASE __c11_atomic_thread_fence (__ATOMIC_RELEASE)
675 */
676 723
677 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__ 724 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__
678 #define ECB_MEMORY_FENCE __sync_synchronize () 725 #define ECB_MEMORY_FENCE __sync_synchronize ()
679 #elif _MSC_VER >= 1500 /* VC++ 2008 */ 726 #elif _MSC_VER >= 1500 /* VC++ 2008 */
680 /* apparently, microsoft broke all the memory barrier stuff in Visual Studio 2008... */ 727 /* apparently, microsoft broke all the memory barrier stuff in Visual Studio 2008... */
743 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE 790 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE
744#endif 791#endif
745 792
746/*****************************************************************************/ 793/*****************************************************************************/
747 794
748#if __cplusplus 795#if ECB_CPP
749 #define ecb_inline static inline 796 #define ecb_inline static inline
750#elif ECB_GCC_VERSION(2,5) 797#elif ECB_GCC_VERSION(2,5)
751 #define ecb_inline static __inline__ 798 #define ecb_inline static __inline__
752#elif ECB_C99 799#elif ECB_C99
753 #define ecb_inline static inline 800 #define ecb_inline static inline
767 814
768#define ECB_CONCAT_(a, b) a ## b 815#define ECB_CONCAT_(a, b) a ## b
769#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b) 816#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b)
770#define ECB_STRINGIFY_(a) # a 817#define ECB_STRINGIFY_(a) # a
771#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a) 818#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a)
819#define ECB_STRINGIFY_EXPR(expr) ((expr), ECB_STRINGIFY_ (expr))
772 820
773#define ecb_function_ ecb_inline 821#define ecb_function_ ecb_inline
774 822
775#if ECB_GCC_VERSION(3,1) 823#if ECB_GCC_VERSION(3,1) || ECB_CLANG_VERSION(2,8)
776 #define ecb_attribute(attrlist) __attribute__(attrlist) 824 #define ecb_attribute(attrlist) __attribute__ (attrlist)
825#else
826 #define ecb_attribute(attrlist)
827#endif
828
829#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_constant_p)
777 #define ecb_is_constant(expr) __builtin_constant_p (expr) 830 #define ecb_is_constant(expr) __builtin_constant_p (expr)
778 #define ecb_expect(expr,value) __builtin_expect ((expr),(value))
779 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
780#else 831#else
781 #define ecb_attribute(attrlist)
782
783 /* possible C11 impl for integral types 832 /* possible C11 impl for integral types
784 typedef struct ecb_is_constant_struct ecb_is_constant_struct; 833 typedef struct ecb_is_constant_struct ecb_is_constant_struct;
785 #define ecb_is_constant(expr) _Generic ((1 ? (struct ecb_is_constant_struct *)0 : (void *)((expr) - (expr)), ecb_is_constant_struct *: 0, default: 1)) */ 834 #define ecb_is_constant(expr) _Generic ((1 ? (struct ecb_is_constant_struct *)0 : (void *)((expr) - (expr)), ecb_is_constant_struct *: 0, default: 1)) */
786 835
787 #define ecb_is_constant(expr) 0 836 #define ecb_is_constant(expr) 0
837#endif
838
839#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_expect)
840 #define ecb_expect(expr,value) __builtin_expect ((expr),(value))
841#else
788 #define ecb_expect(expr,value) (expr) 842 #define ecb_expect(expr,value) (expr)
843#endif
844
845#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_prefetch)
846 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
847#else
789 #define ecb_prefetch(addr,rw,locality) 848 #define ecb_prefetch(addr,rw,locality)
790#endif 849#endif
791 850
792/* no emulation for ecb_decltype */ 851/* no emulation for ecb_decltype */
793#if ECB_GCC_VERSION(4,5) 852#if ECB_CPP11
853 // older implementations might have problems with decltype(x)::type, work around it
854 template<class T> struct ecb_decltype_t { typedef T type; };
794 #define ecb_decltype(x) __decltype(x) 855 #define ecb_decltype(x) ecb_decltype_t<decltype (x)>::type
795#elif ECB_GCC_VERSION(3,0) 856#elif ECB_GCC_VERSION(3,0) || ECB_CLANG_VERSION(2,8)
796 #define ecb_decltype(x) __typeof(x) 857 #define ecb_decltype(x) __typeof__ (x)
797#endif 858#endif
798 859
860#if _MSC_VER >= 1300
861 #define ecb_deprecated __declspec (deprecated)
862#else
863 #define ecb_deprecated ecb_attribute ((__deprecated__))
864#endif
865
866#if _MSC_VER >= 1500
867 #define ecb_deprecated_message(msg) __declspec (deprecated (msg))
868#elif ECB_GCC_VERSION(4,5)
869 #define ecb_deprecated_message(msg) ecb_attribute ((__deprecated__ (msg))
870#else
871 #define ecb_deprecated_message(msg) ecb_deprecated
872#endif
873
874#if _MSC_VER >= 1400
875 #define ecb_noinline __declspec (noinline)
876#else
799#define ecb_noinline ecb_attribute ((__noinline__)) 877 #define ecb_noinline ecb_attribute ((__noinline__))
878#endif
879
800#define ecb_unused ecb_attribute ((__unused__)) 880#define ecb_unused ecb_attribute ((__unused__))
801#define ecb_const ecb_attribute ((__const__)) 881#define ecb_const ecb_attribute ((__const__))
802#define ecb_pure ecb_attribute ((__pure__)) 882#define ecb_pure ecb_attribute ((__pure__))
803 883
804#if ECB_C11 884#if ECB_C11 || __IBMC_NORETURN
885 /* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/language_ref/noreturn.html */
805 #define ecb_noreturn _Noreturn 886 #define ecb_noreturn _Noreturn
887#elif ECB_CPP11
888 #define ecb_noreturn [[noreturn]]
889#elif _MSC_VER >= 1200
890 /* http://msdn.microsoft.com/en-us/library/k6ktzx3s.aspx */
891 #define ecb_noreturn __declspec (noreturn)
806#else 892#else
807 #define ecb_noreturn ecb_attribute ((__noreturn__)) 893 #define ecb_noreturn ecb_attribute ((__noreturn__))
808#endif 894#endif
809 895
810#if ECB_GCC_VERSION(4,3) 896#if ECB_GCC_VERSION(4,3)
825/* for compatibility to the rest of the world */ 911/* for compatibility to the rest of the world */
826#define ecb_likely(expr) ecb_expect_true (expr) 912#define ecb_likely(expr) ecb_expect_true (expr)
827#define ecb_unlikely(expr) ecb_expect_false (expr) 913#define ecb_unlikely(expr) ecb_expect_false (expr)
828 914
829/* count trailing zero bits and count # of one bits */ 915/* count trailing zero bits and count # of one bits */
830#if ECB_GCC_VERSION(3,4) 916#if ECB_GCC_VERSION(3,4) \
917 || (ECB_CLANG_BUILTIN(__builtin_clz) && ECB_CLANG_BUILTIN(__builtin_clzll) \
918 && ECB_CLANG_BUILTIN(__builtin_ctz) && ECB_CLANG_BUILTIN(__builtin_ctzll) \
919 && ECB_CLANG_BUILTIN(__builtin_popcount))
831 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */ 920 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */
832 #define ecb_ld32(x) (__builtin_clz (x) ^ 31) 921 #define ecb_ld32(x) (__builtin_clz (x) ^ 31)
833 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63) 922 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63)
834 #define ecb_ctz32(x) __builtin_ctz (x) 923 #define ecb_ctz32(x) __builtin_ctz (x)
835 #define ecb_ctz64(x) __builtin_ctzll (x) 924 #define ecb_ctz64(x) __builtin_ctzll (x)
836 #define ecb_popcount32(x) __builtin_popcount (x) 925 #define ecb_popcount32(x) __builtin_popcount (x)
837 /* no popcountll */ 926 /* no popcountll */
838#else 927#else
839 ecb_function_ int ecb_ctz32 (uint32_t x) ecb_const; 928 ecb_function_ ecb_const int ecb_ctz32 (uint32_t x);
840 ecb_function_ int 929 ecb_function_ ecb_const int
841 ecb_ctz32 (uint32_t x) 930 ecb_ctz32 (uint32_t x)
842 { 931 {
932#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
933 unsigned long r;
934 _BitScanForward (&r, x);
935 return (int)r;
936#else
843 int r = 0; 937 int r = 0;
844 938
845 x &= ~x + 1; /* this isolates the lowest bit */ 939 x &= ~x + 1; /* this isolates the lowest bit */
846 940
847#if ECB_branchless_on_i386 941#if ECB_branchless_on_i386
857 if (x & 0xff00ff00) r += 8; 951 if (x & 0xff00ff00) r += 8;
858 if (x & 0xffff0000) r += 16; 952 if (x & 0xffff0000) r += 16;
859#endif 953#endif
860 954
861 return r; 955 return r;
956#endif
862 } 957 }
863 958
864 ecb_function_ int ecb_ctz64 (uint64_t x) ecb_const; 959 ecb_function_ ecb_const int ecb_ctz64 (uint64_t x);
865 ecb_function_ int 960 ecb_function_ ecb_const int
866 ecb_ctz64 (uint64_t x) 961 ecb_ctz64 (uint64_t x)
867 { 962 {
963#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
964 unsigned long r;
965 _BitScanForward64 (&r, x);
966 return (int)r;
967#else
868 int shift = x & 0xffffffffU ? 0 : 32; 968 int shift = x & 0xffffffff ? 0 : 32;
869 return ecb_ctz32 (x >> shift) + shift; 969 return ecb_ctz32 (x >> shift) + shift;
970#endif
870 } 971 }
871 972
872 ecb_function_ int ecb_popcount32 (uint32_t x) ecb_const; 973 ecb_function_ ecb_const int ecb_popcount32 (uint32_t x);
873 ecb_function_ int 974 ecb_function_ ecb_const int
874 ecb_popcount32 (uint32_t x) 975 ecb_popcount32 (uint32_t x)
875 { 976 {
876 x -= (x >> 1) & 0x55555555; 977 x -= (x >> 1) & 0x55555555;
877 x = ((x >> 2) & 0x33333333) + (x & 0x33333333); 978 x = ((x >> 2) & 0x33333333) + (x & 0x33333333);
878 x = ((x >> 4) + x) & 0x0f0f0f0f; 979 x = ((x >> 4) + x) & 0x0f0f0f0f;
879 x *= 0x01010101; 980 x *= 0x01010101;
880 981
881 return x >> 24; 982 return x >> 24;
882 } 983 }
883 984
884 ecb_function_ int ecb_ld32 (uint32_t x) ecb_const; 985 ecb_function_ ecb_const int ecb_ld32 (uint32_t x);
885 ecb_function_ int ecb_ld32 (uint32_t x) 986 ecb_function_ ecb_const int ecb_ld32 (uint32_t x)
886 { 987 {
988#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
989 unsigned long r;
990 _BitScanReverse (&r, x);
991 return (int)r;
992#else
887 int r = 0; 993 int r = 0;
888 994
889 if (x >> 16) { x >>= 16; r += 16; } 995 if (x >> 16) { x >>= 16; r += 16; }
890 if (x >> 8) { x >>= 8; r += 8; } 996 if (x >> 8) { x >>= 8; r += 8; }
891 if (x >> 4) { x >>= 4; r += 4; } 997 if (x >> 4) { x >>= 4; r += 4; }
892 if (x >> 2) { x >>= 2; r += 2; } 998 if (x >> 2) { x >>= 2; r += 2; }
893 if (x >> 1) { r += 1; } 999 if (x >> 1) { r += 1; }
894 1000
895 return r; 1001 return r;
1002#endif
896 } 1003 }
897 1004
898 ecb_function_ int ecb_ld64 (uint64_t x) ecb_const; 1005 ecb_function_ ecb_const int ecb_ld64 (uint64_t x);
899 ecb_function_ int ecb_ld64 (uint64_t x) 1006 ecb_function_ ecb_const int ecb_ld64 (uint64_t x)
900 { 1007 {
1008#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
1009 unsigned long r;
1010 _BitScanReverse64 (&r, x);
1011 return (int)r;
1012#else
901 int r = 0; 1013 int r = 0;
902 1014
903 if (x >> 32) { x >>= 32; r += 32; } 1015 if (x >> 32) { x >>= 32; r += 32; }
904 1016
905 return r + ecb_ld32 (x); 1017 return r + ecb_ld32 (x);
1018#endif
906 } 1019 }
907#endif 1020#endif
908 1021
909ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) ecb_const; 1022ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x);
910ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); } 1023ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); }
911ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) ecb_const; 1024ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x);
912ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); } 1025ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); }
913 1026
914ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) ecb_const; 1027ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x);
915ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) 1028ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x)
916{ 1029{
917 return ( (x * 0x0802U & 0x22110U) 1030 return ( (x * 0x0802U & 0x22110U)
918 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16; 1031 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16;
919} 1032}
920 1033
921ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) ecb_const; 1034ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x);
922ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) 1035ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x)
923{ 1036{
924 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1); 1037 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1);
925 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2); 1038 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2);
926 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4); 1039 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4);
927 x = ( x >> 8 ) | ( x << 8); 1040 x = ( x >> 8 ) | ( x << 8);
928 1041
929 return x; 1042 return x;
930} 1043}
931 1044
932ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) ecb_const; 1045ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x);
933ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) 1046ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x)
934{ 1047{
935 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1); 1048 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1);
936 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2); 1049 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2);
937 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4); 1050 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4);
938 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8); 1051 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8);
941 return x; 1054 return x;
942} 1055}
943 1056
944/* popcount64 is only available on 64 bit cpus as gcc builtin */ 1057/* popcount64 is only available on 64 bit cpus as gcc builtin */
945/* so for this version we are lazy */ 1058/* so for this version we are lazy */
946ecb_function_ int ecb_popcount64 (uint64_t x) ecb_const; 1059ecb_function_ ecb_const int ecb_popcount64 (uint64_t x);
947ecb_function_ int 1060ecb_function_ ecb_const int
948ecb_popcount64 (uint64_t x) 1061ecb_popcount64 (uint64_t x)
949{ 1062{
950 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32); 1063 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32);
951} 1064}
952 1065
953ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) ecb_const; 1066ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count);
954ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) ecb_const; 1067ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count);
955ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) ecb_const; 1068ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count);
956ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) ecb_const; 1069ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count);
957ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) ecb_const; 1070ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count);
958ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) ecb_const; 1071ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count);
959ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) ecb_const; 1072ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count);
960ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) ecb_const; 1073ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count);
961 1074
962ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); } 1075ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); }
963ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); } 1076ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); }
964ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); } 1077ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); }
965ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); } 1078ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); }
966ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); } 1079ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); }
967ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); } 1080ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); }
968ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); } 1081ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); }
969ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); } 1082ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); }
970 1083
971#if ECB_GCC_VERSION(4,3) 1084#if ECB_GCC_VERSION(4,3) || (ECB_CLANG_BUILTIN(__builtin_bswap32) && ECB_CLANG_BUILTIN(__builtin_bswap64))
1085 #if ECB_GCC_VERSION(4,8) || ECB_CLANG_BUILTIN(__builtin_bswap16)
1086 #define ecb_bswap16(x) __builtin_bswap16 (x)
1087 #else
972 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16) 1088 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16)
1089 #endif
973 #define ecb_bswap32(x) __builtin_bswap32 (x) 1090 #define ecb_bswap32(x) __builtin_bswap32 (x)
974 #define ecb_bswap64(x) __builtin_bswap64 (x) 1091 #define ecb_bswap64(x) __builtin_bswap64 (x)
1092#elif _MSC_VER
1093 #include <stdlib.h>
1094 #define ecb_bswap16(x) ((uint16_t)_byteswap_ushort ((uint16_t)(x)))
1095 #define ecb_bswap32(x) ((uint32_t)_byteswap_ulong ((uint32_t)(x)))
1096 #define ecb_bswap64(x) ((uint64_t)_byteswap_uint64 ((uint64_t)(x)))
975#else 1097#else
976 ecb_function_ uint16_t ecb_bswap16 (uint16_t x) ecb_const; 1098 ecb_function_ ecb_const uint16_t ecb_bswap16 (uint16_t x);
977 ecb_function_ uint16_t 1099 ecb_function_ ecb_const uint16_t
978 ecb_bswap16 (uint16_t x) 1100 ecb_bswap16 (uint16_t x)
979 { 1101 {
980 return ecb_rotl16 (x, 8); 1102 return ecb_rotl16 (x, 8);
981 } 1103 }
982 1104
983 ecb_function_ uint32_t ecb_bswap32 (uint32_t x) ecb_const; 1105 ecb_function_ ecb_const uint32_t ecb_bswap32 (uint32_t x);
984 ecb_function_ uint32_t 1106 ecb_function_ ecb_const uint32_t
985 ecb_bswap32 (uint32_t x) 1107 ecb_bswap32 (uint32_t x)
986 { 1108 {
987 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16); 1109 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16);
988 } 1110 }
989 1111
990 ecb_function_ uint64_t ecb_bswap64 (uint64_t x) ecb_const; 1112 ecb_function_ ecb_const uint64_t ecb_bswap64 (uint64_t x);
991 ecb_function_ uint64_t 1113 ecb_function_ ecb_const uint64_t
992 ecb_bswap64 (uint64_t x) 1114 ecb_bswap64 (uint64_t x)
993 { 1115 {
994 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32); 1116 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32);
995 } 1117 }
996#endif 1118#endif
997 1119
998#if ECB_GCC_VERSION(4,5) 1120#if ECB_GCC_VERSION(4,5) || ECB_CLANG_BUILTIN(__builtin_unreachable)
999 #define ecb_unreachable() __builtin_unreachable () 1121 #define ecb_unreachable() __builtin_unreachable ()
1000#else 1122#else
1001 /* this seems to work fine, but gcc always emits a warning for it :/ */ 1123 /* this seems to work fine, but gcc always emits a warning for it :/ */
1002 ecb_inline void ecb_unreachable (void) ecb_noreturn; 1124 ecb_inline ecb_noreturn void ecb_unreachable (void);
1003 ecb_inline void ecb_unreachable (void) { } 1125 ecb_inline ecb_noreturn void ecb_unreachable (void) { }
1004#endif 1126#endif
1005 1127
1006/* try to tell the compiler that some condition is definitely true */ 1128/* try to tell the compiler that some condition is definitely true */
1007#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0 1129#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0
1008 1130
1009ecb_inline unsigned char ecb_byteorder_helper (void) ecb_const; 1131ecb_inline ecb_const uint32_t ecb_byteorder_helper (void);
1010ecb_inline unsigned char 1132ecb_inline ecb_const uint32_t
1011ecb_byteorder_helper (void) 1133ecb_byteorder_helper (void)
1012{ 1134{
1013 /* the union code still generates code under pressure in gcc, */ 1135 /* the union code still generates code under pressure in gcc, */
1014 /* but less than using pointers, and always seems to */ 1136 /* but less than using pointers, and always seems to */
1015 /* successfully return a constant. */ 1137 /* successfully return a constant. */
1016 /* the reason why we have this horrible preprocessor mess */ 1138 /* the reason why we have this horrible preprocessor mess */
1017 /* is to avoid it in all cases, at least on common architectures */ 1139 /* is to avoid it in all cases, at least on common architectures */
1018 /* or when using a recent enough gcc version (>= 4.6) */ 1140 /* or when using a recent enough gcc version (>= 4.6) */
1019#if __i386 || __i386__ || _M_X86 || __amd64 || __amd64__ || _M_X64
1020 return 0x44;
1021#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__ 1141#if (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__) \
1142 || ((__i386 || __i386__ || _M_IX86 || ECB_GCC_AMD64 || ECB_MSVC_AMD64) && !__VOS__)
1143 #define ECB_LITTLE_ENDIAN 1
1022 return 0x44; 1144 return 0x44332211;
1023#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__ 1145#elif (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__) \
1146 || ((__AARCH64EB__ || __MIPSEB__ || __ARMEB__) && !__VOS__)
1147 #define ECB_BIG_ENDIAN 1
1024 return 0x11; 1148 return 0x11223344;
1025#else 1149#else
1026 union 1150 union
1027 { 1151 {
1152 uint8_t c[4];
1028 uint32_t i; 1153 uint32_t u;
1029 uint8_t c;
1030 } u = { 0x11223344 }; 1154 } u = { 0x11, 0x22, 0x33, 0x44 };
1031 return u.c; 1155 return u.u;
1032#endif 1156#endif
1033} 1157}
1034 1158
1035ecb_inline ecb_bool ecb_big_endian (void) ecb_const; 1159ecb_inline ecb_const ecb_bool ecb_big_endian (void);
1036ecb_inline ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11; } 1160ecb_inline ecb_const ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11223344; }
1037ecb_inline ecb_bool ecb_little_endian (void) ecb_const; 1161ecb_inline ecb_const ecb_bool ecb_little_endian (void);
1038ecb_inline ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44; } 1162ecb_inline ecb_const ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44332211; }
1039 1163
1040#if ECB_GCC_VERSION(3,0) || ECB_C99 1164#if ECB_GCC_VERSION(3,0) || ECB_C99
1041 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0)) 1165 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0))
1042#else 1166#else
1043 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n))) 1167 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n)))
1044#endif 1168#endif
1045 1169
1046#if __cplusplus 1170#if ECB_CPP
1047 template<typename T> 1171 template<typename T>
1048 static inline T ecb_div_rd (T val, T div) 1172 static inline T ecb_div_rd (T val, T div)
1049 { 1173 {
1050 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div; 1174 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div;
1051 } 1175 }
1068 } 1192 }
1069#else 1193#else
1070 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0])) 1194 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0]))
1071#endif 1195#endif
1072 1196
1197ecb_function_ ecb_const uint32_t ecb_binary16_to_binary32 (uint32_t x);
1198ecb_function_ ecb_const uint32_t
1199ecb_binary16_to_binary32 (uint32_t x)
1200{
1201 unsigned int s = (x & 0x8000) << (31 - 15);
1202 int e = (x >> 10) & 0x001f;
1203 unsigned int m = x & 0x03ff;
1204
1205 if (ecb_expect_false (e == 31))
1206 /* infinity or NaN */
1207 e = 255 - (127 - 15);
1208 else if (ecb_expect_false (!e))
1209 {
1210 if (ecb_expect_true (!m))
1211 /* zero, handled by code below by forcing e to 0 */
1212 e = 0 - (127 - 15);
1213 else
1214 {
1215 /* subnormal, renormalise */
1216 unsigned int s = 10 - ecb_ld32 (m);
1217
1218 m = (m << s) & 0x3ff; /* mask implicit bit */
1219 e -= s - 1;
1220 }
1221 }
1222
1223 /* e and m now are normalised, or zero, (or inf or nan) */
1224 e += 127 - 15;
1225
1226 return s | (e << 23) | (m << (23 - 10));
1227}
1228
1229ecb_function_ ecb_const uint16_t ecb_binary32_to_binary16 (uint32_t x);
1230ecb_function_ ecb_const uint16_t
1231ecb_binary32_to_binary16 (uint32_t x)
1232{
1233 unsigned int s = (x >> 16) & 0x00008000; /* sign bit, the easy part */
1234 unsigned int e = ((x >> 23) & 0x000000ff) - (127 - 15); /* the desired exponent */
1235 unsigned int m = x & 0x007fffff;
1236
1237 x &= 0x7fffffff;
1238
1239 /* if it's within range of binary16 normals, use fast path */
1240 if (ecb_expect_true (0x38800000 <= x && x <= 0x477fefff))
1241 {
1242 /* mantissa round-to-even */
1243 m += 0x00000fff + ((m >> (23 - 10)) & 1);
1244
1245 /* handle overflow */
1246 if (ecb_expect_false (m >= 0x00800000))
1247 {
1248 m >>= 1;
1249 e += 1;
1250 }
1251
1252 return s | (e << 10) | (m >> (23 - 10));
1253 }
1254
1255 /* handle large numbers and infinity */
1256 if (ecb_expect_true (0x477fefff < x && x <= 0x7f800000))
1257 return s | 0x7c00;
1258
1259 /* handle zero, subnormals and small numbers */
1260 if (ecb_expect_true (x < 0x38800000))
1261 {
1262 /* zero */
1263 if (ecb_expect_true (!x))
1264 return s;
1265
1266 /* handle subnormals */
1267
1268 /* too small, will be zero */
1269 if (e < (14 - 24)) /* might not be sharp, but is good enough */
1270 return s;
1271
1272 m |= 0x00800000; /* make implicit bit explicit */
1273
1274 /* very tricky - we need to round to the nearest e (+10) bit value */
1275 {
1276 unsigned int bits = 14 - e;
1277 unsigned int half = (1 << (bits - 1)) - 1;
1278 unsigned int even = (m >> bits) & 1;
1279
1280 /* if this overflows, we will end up with a normalised number */
1281 m = (m + half + even) >> bits;
1282 }
1283
1284 return s | m;
1285 }
1286
1287 /* handle NaNs, preserve leftmost nan bits, but make sure we don't turn them into infinities */
1288 m >>= 13;
1289
1290 return s | 0x7c00 | m | !m;
1291}
1292
1073/*******************************************************************************/ 1293/*******************************************************************************/
1074/* floating point stuff, can be disabled by defining ECB_NO_LIBM */ 1294/* floating point stuff, can be disabled by defining ECB_NO_LIBM */
1075 1295
1076/* basically, everything uses "ieee pure-endian" floating point numbers */ 1296/* basically, everything uses "ieee pure-endian" floating point numbers */
1077/* the only noteworthy exception is ancient armle, which uses order 43218765 */ 1297/* the only noteworthy exception is ancient armle, which uses order 43218765 */
1078#if 0 \ 1298#if 0 \
1079 || __i386 || __i386__ \ 1299 || __i386 || __i386__ \
1080 || __amd64 || __amd64__ || __x86_64 || __x86_64__ \ 1300 || ECB_GCC_AMD64 \
1081 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \ 1301 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \
1082 || defined __arm__ && defined __ARM_EABI__ \
1083 || defined __s390__ || defined __s390x__ \ 1302 || defined __s390__ || defined __s390x__ \
1084 || defined __mips__ \ 1303 || defined __mips__ \
1085 || defined __alpha__ \ 1304 || defined __alpha__ \
1086 || defined __hppa__ \ 1305 || defined __hppa__ \
1087 || defined __ia64__ \ 1306 || defined __ia64__ \
1088 || defined __m68k__ \ 1307 || defined __m68k__ \
1089 || defined __m88k__ \ 1308 || defined __m88k__ \
1090 || defined __sh__ \ 1309 || defined __sh__ \
1091 || defined _M_IX86 || defined _M_AMD64 || defined _M_IA64 \ 1310 || defined _M_IX86 || defined ECB_MSVC_AMD64 || defined _M_IA64 \
1092 || (defined __arm__ && (defined __ARM_EABI__ || defined __EABI__ || defined __VFP_FP__ || defined _WIN32_WCE || defined __ANDROID__)) 1311 || (defined __arm__ && (defined __ARM_EABI__ || defined __EABI__ || defined __VFP_FP__ || defined _WIN32_WCE || defined __ANDROID__)) \
1312 || defined __aarch64__
1093 #define ECB_STDFP 1 1313 #define ECB_STDFP 1
1094 #include <string.h> /* for memcpy */ 1314 #include <string.h> /* for memcpy */
1095#else 1315#else
1096 #define ECB_STDFP 0 1316 #define ECB_STDFP 0
1097#endif 1317#endif
1111 #define ECB_NAN NAN 1331 #define ECB_NAN NAN
1112 #else 1332 #else
1113 #define ECB_NAN ECB_INFINITY 1333 #define ECB_NAN ECB_INFINITY
1114 #endif 1334 #endif
1115 1335
1116 /* converts an ieee half/binary16 to a float */ 1336 #if ECB_C99 || _XOPEN_VERSION >= 600 || _POSIX_VERSION >= 200112L
1117 ecb_function_ float ecb_binary16_to_float (uint16_t x) ecb_const; 1337 #define ecb_ldexpf(x,e) ldexpf ((x), (e))
1118 ecb_function_ float 1338 #define ecb_frexpf(x,e) frexpf ((x), (e))
1119 ecb_binary16_to_float (uint16_t x) 1339 #else
1120 { 1340 #define ecb_ldexpf(x,e) (float) ldexp ((double) (x), (e))
1121 int e = (x >> 10) & 0x1f; 1341 #define ecb_frexpf(x,e) (float) frexp ((double) (x), (e))
1122 int m = x & 0x3ff; 1342 #endif
1123 float r;
1124
1125 if (!e ) r = ldexpf (m , -24);
1126 else if (e != 31) r = ldexpf (m + 0x400, e - 25);
1127 else if (m ) r = ECB_NAN;
1128 else r = ECB_INFINITY;
1129
1130 return x & 0x8000 ? -r : r;
1131 }
1132 1343
1133 /* convert a float to ieee single/binary32 */ 1344 /* convert a float to ieee single/binary32 */
1134 ecb_function_ uint32_t ecb_float_to_binary32 (float x) ecb_const; 1345 ecb_function_ ecb_const uint32_t ecb_float_to_binary32 (float x);
1135 ecb_function_ uint32_t 1346 ecb_function_ ecb_const uint32_t
1136 ecb_float_to_binary32 (float x) 1347 ecb_float_to_binary32 (float x)
1137 { 1348 {
1138 uint32_t r; 1349 uint32_t r;
1139 1350
1140 #if ECB_STDFP 1351 #if ECB_STDFP
1147 if (x == 0e0f ) return 0x00000000U; 1358 if (x == 0e0f ) return 0x00000000U;
1148 if (x > +3.40282346638528860e+38f) return 0x7f800000U; 1359 if (x > +3.40282346638528860e+38f) return 0x7f800000U;
1149 if (x < -3.40282346638528860e+38f) return 0xff800000U; 1360 if (x < -3.40282346638528860e+38f) return 0xff800000U;
1150 if (x != x ) return 0x7fbfffffU; 1361 if (x != x ) return 0x7fbfffffU;
1151 1362
1152 m = frexpf (x, &e) * 0x1000000U; 1363 m = ecb_frexpf (x, &e) * 0x1000000U;
1153 1364
1154 r = m & 0x80000000U; 1365 r = m & 0x80000000U;
1155 1366
1156 if (r) 1367 if (r)
1157 m = -m; 1368 m = -m;
1169 1380
1170 return r; 1381 return r;
1171 } 1382 }
1172 1383
1173 /* converts an ieee single/binary32 to a float */ 1384 /* converts an ieee single/binary32 to a float */
1174 ecb_function_ float ecb_binary32_to_float (uint32_t x) ecb_const; 1385 ecb_function_ ecb_const float ecb_binary32_to_float (uint32_t x);
1175 ecb_function_ float 1386 ecb_function_ ecb_const float
1176 ecb_binary32_to_float (uint32_t x) 1387 ecb_binary32_to_float (uint32_t x)
1177 { 1388 {
1178 float r; 1389 float r;
1179 1390
1180 #if ECB_STDFP 1391 #if ECB_STDFP
1190 x |= 0x800000U; 1401 x |= 0x800000U;
1191 else 1402 else
1192 e = 1; 1403 e = 1;
1193 1404
1194 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */ 1405 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */
1195 r = ldexpf (x * (0.5f / 0x800000U), e - 126); 1406 r = ecb_ldexpf (x * (0.5f / 0x800000U), e - 126);
1196 1407
1197 r = neg ? -r : r; 1408 r = neg ? -r : r;
1198 #endif 1409 #endif
1199 1410
1200 return r; 1411 return r;
1201 } 1412 }
1202 1413
1203 /* convert a double to ieee double/binary64 */ 1414 /* convert a double to ieee double/binary64 */
1204 ecb_function_ uint64_t ecb_double_to_binary64 (double x) ecb_const; 1415 ecb_function_ ecb_const uint64_t ecb_double_to_binary64 (double x);
1205 ecb_function_ uint64_t 1416 ecb_function_ ecb_const uint64_t
1206 ecb_double_to_binary64 (double x) 1417 ecb_double_to_binary64 (double x)
1207 { 1418 {
1208 uint64_t r; 1419 uint64_t r;
1209 1420
1210 #if ECB_STDFP 1421 #if ECB_STDFP
1239 1450
1240 return r; 1451 return r;
1241 } 1452 }
1242 1453
1243 /* converts an ieee double/binary64 to a double */ 1454 /* converts an ieee double/binary64 to a double */
1244 ecb_function_ double ecb_binary64_to_double (uint64_t x) ecb_const; 1455 ecb_function_ ecb_const double ecb_binary64_to_double (uint64_t x);
1245 ecb_function_ double 1456 ecb_function_ ecb_const double
1246 ecb_binary64_to_double (uint64_t x) 1457 ecb_binary64_to_double (uint64_t x)
1247 { 1458 {
1248 double r; 1459 double r;
1249 1460
1250 #if ECB_STDFP 1461 #if ECB_STDFP
1266 1477
1267 r = neg ? -r : r; 1478 r = neg ? -r : r;
1268 #endif 1479 #endif
1269 1480
1270 return r; 1481 return r;
1482 }
1483
1484 /* convert a float to ieee half/binary16 */
1485 ecb_function_ ecb_const uint16_t ecb_float_to_binary16 (float x);
1486 ecb_function_ ecb_const uint16_t
1487 ecb_float_to_binary16 (float x)
1488 {
1489 return ecb_binary32_to_binary16 (ecb_float_to_binary32 (x));
1490 }
1491
1492 /* convert an ieee half/binary16 to float */
1493 ecb_function_ ecb_const float ecb_binary16_to_float (uint16_t x);
1494 ecb_function_ ecb_const float
1495 ecb_binary16_to_float (uint16_t x)
1496 {
1497 return ecb_binary32_to_float (ecb_binary16_to_binary32 (x));
1271 } 1498 }
1272 1499
1273#endif 1500#endif
1274 1501
1275#endif 1502#endif
2586{ 2813{
2587 invoke_cb = invoke_pending_cb; 2814 invoke_cb = invoke_pending_cb;
2588} 2815}
2589 2816
2590void 2817void
2591ev_set_loop_release_cb (EV_P_ ev_loop_callback_nothrow release, ev_loop_callback_nothrow acquire) EV_THROW 2818ev_set_loop_release_cb (EV_P_ void (*release)(EV_P) EV_THROW, void (*acquire)(EV_P) EV_THROW) EV_THROW
2592{ 2819{
2593 release_cb = release; 2820 release_cb = release;
2594 acquire_cb = acquire; 2821 acquire_cb = acquire;
2595} 2822}
2596#endif 2823#endif
2822#if EV_USE_INOTIFY 3049#if EV_USE_INOTIFY
2823 infy_fork (EV_A); 3050 infy_fork (EV_A);
2824#endif 3051#endif
2825 3052
2826#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE 3053#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE
2827 if (ev_is_active (&pipe_w)) 3054 if (ev_is_active (&pipe_w) && postfork != 2)
2828 { 3055 {
2829 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */ 3056 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */
2830 3057
2831 ev_ref (EV_A); 3058 ev_ref (EV_A);
2832 ev_io_stop (EV_A_ &pipe_w); 3059 ev_io_stop (EV_A_ &pipe_w);

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines