ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/libev/ev.c
(Generate patch)

Comparing libev/ev.c (file contents):
Revision 1.469 by root, Fri Sep 5 16:21:19 2014 UTC vs.
Revision 1.479 by root, Sun Dec 20 01:31:17 2015 UTC

256# else 256# else
257# define EV_USE_CLOCK_SYSCALL 0 257# define EV_USE_CLOCK_SYSCALL 0
258# endif 258# endif
259#endif 259#endif
260 260
261#if !(_POSIX_TIMERS > 0)
262# ifndef EV_USE_MONOTONIC
263# define EV_USE_MONOTONIC 0
264# endif
265# ifndef EV_USE_REALTIME
266# define EV_USE_REALTIME 0
267# endif
268#endif
269
261#ifndef EV_USE_MONOTONIC 270#ifndef EV_USE_MONOTONIC
262# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0 271# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0
263# define EV_USE_MONOTONIC EV_FEATURE_OS 272# define EV_USE_MONOTONIC EV_FEATURE_OS
264# else 273# else
265# define EV_USE_MONOTONIC 0 274# define EV_USE_MONOTONIC 0
482/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */ 491/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */
483/* ECB.H BEGIN */ 492/* ECB.H BEGIN */
484/* 493/*
485 * libecb - http://software.schmorp.de/pkg/libecb 494 * libecb - http://software.schmorp.de/pkg/libecb
486 * 495 *
487 * Copyright (©) 2009-2014 Marc Alexander Lehmann <libecb@schmorp.de> 496 * Copyright (©) 2009-2015 Marc Alexander Lehmann <libecb@schmorp.de>
488 * Copyright (©) 2011 Emanuele Giaquinta 497 * Copyright (©) 2011 Emanuele Giaquinta
489 * All rights reserved. 498 * All rights reserved.
490 * 499 *
491 * Redistribution and use in source and binary forms, with or without modifica- 500 * Redistribution and use in source and binary forms, with or without modifica-
492 * tion, are permitted provided that the following conditions are met: 501 * tion, are permitted provided that the following conditions are met:
523 532
524#ifndef ECB_H 533#ifndef ECB_H
525#define ECB_H 534#define ECB_H
526 535
527/* 16 bits major, 16 bits minor */ 536/* 16 bits major, 16 bits minor */
528#define ECB_VERSION 0x00010003 537#define ECB_VERSION 0x00010005
529 538
530#ifdef _WIN32 539#ifdef _WIN32
531 typedef signed char int8_t; 540 typedef signed char int8_t;
532 typedef unsigned char uint8_t; 541 typedef unsigned char uint8_t;
533 typedef signed short int16_t; 542 typedef signed short int16_t;
550 typedef uint32_t uintptr_t; 559 typedef uint32_t uintptr_t;
551 typedef int32_t intptr_t; 560 typedef int32_t intptr_t;
552 #endif 561 #endif
553#else 562#else
554 #include <inttypes.h> 563 #include <inttypes.h>
555 #if UINTMAX_MAX > 0xffffffffU 564 #if (defined INTPTR_MAX ? INTPTR_MAX : ULONG_MAX) > 0xffffffffU
556 #define ECB_PTRSIZE 8 565 #define ECB_PTRSIZE 8
557 #else 566 #else
558 #define ECB_PTRSIZE 4 567 #define ECB_PTRSIZE 4
559 #endif 568 #endif
560#endif 569#endif
561 570
571#define ECB_GCC_AMD64 (__amd64 || __amd64__ || __x86_64 || __x86_64__)
572#define ECB_MSVC_AMD64 (_M_AMD64 || _M_X64)
573
562/* work around x32 idiocy by defining proper macros */ 574/* work around x32 idiocy by defining proper macros */
563#if __amd64 || __x86_64 || _M_AMD64 || _M_X64 575#if ECB_GCC_AMD64 || ECB_MSVC_AMD64
564 #if _ILP32 576 #if _ILP32
565 #define ECB_AMD64_X32 1 577 #define ECB_AMD64_X32 1
566 #else 578 #else
567 #define ECB_AMD64 1 579 #define ECB_AMD64 1
568 #endif 580 #endif
573 * causing enormous grief in return for some better fake benchmark numbers. 585 * causing enormous grief in return for some better fake benchmark numbers.
574 * or so. 586 * or so.
575 * we try to detect these and simply assume they are not gcc - if they have 587 * we try to detect these and simply assume they are not gcc - if they have
576 * an issue with that they should have done it right in the first place. 588 * an issue with that they should have done it right in the first place.
577 */ 589 */
578#ifndef ECB_GCC_VERSION
579 #if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__ 590#if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__
580 #define ECB_GCC_VERSION(major,minor) 0 591 #define ECB_GCC_VERSION(major,minor) 0
581 #else 592#else
582 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor))) 593 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor)))
583 #endif 594#endif
595
596#define ECB_CLANG_VERSION(major,minor) (__clang_major__ > (major) || (__clang_major__ == (major) && __clang_minor__ >= (minor)))
597
598#if __clang__ && defined __has_builtin
599 #define ECB_CLANG_BUILTIN(x) __has_builtin (x)
600#else
601 #define ECB_CLANG_BUILTIN(x) 0
602#endif
603
604#if __clang__ && defined __has_extension
605 #define ECB_CLANG_EXTENSION(x) __has_extension (x)
606#else
607 #define ECB_CLANG_EXTENSION(x) 0
584#endif 608#endif
585 609
586#define ECB_CPP (__cplusplus+0) 610#define ECB_CPP (__cplusplus+0)
587#define ECB_CPP11 (__cplusplus >= 201103L) 611#define ECB_CPP11 (__cplusplus >= 201103L)
588 612
616 #define ECB_NO_SMP 1 640 #define ECB_NO_SMP 1
617#endif 641#endif
618 642
619#if ECB_NO_SMP 643#if ECB_NO_SMP
620 #define ECB_MEMORY_FENCE do { } while (0) 644 #define ECB_MEMORY_FENCE do { } while (0)
645#endif
646
647/* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/compiler_ref/compiler_builtins.html */
648#if __xlC__ && ECB_CPP
649 #include <builtins.h>
650#endif
651
652#if 1400 <= _MSC_VER
653 #include <intrin.h> /* fence functions _ReadBarrier, also bit search functions _BitScanReverse */
621#endif 654#endif
622 655
623#ifndef ECB_MEMORY_FENCE 656#ifndef ECB_MEMORY_FENCE
624 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110 657 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110
625 #if __i386 || __i386__ 658 #if __i386 || __i386__
626 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory") 659 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory")
627 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 660 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
628 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 661 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
629 #elif __amd64 || __amd64__ || __x86_64 || __x86_64__ 662 #elif ECB_GCC_AMD64
630 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory") 663 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory")
631 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 664 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
632 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 665 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
633 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ 666 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__
634 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory") 667 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory")
668 #elif defined __ARM_ARCH_2__ \
669 || defined __ARM_ARCH_3__ || defined __ARM_ARCH_3M__ \
670 || defined __ARM_ARCH_4__ || defined __ARM_ARCH_4T__ \
671 || defined __ARM_ARCH_5__ || defined __ARM_ARCH_5E__ \
672 || defined __ARM_ARCH_5T__ || defined __ARM_ARCH_5TE__ \
673 || defined __ARM_ARCH_5TEJ__
674 /* should not need any, unless running old code on newer cpu - arm doesn't support that */
635 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \ 675 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \
636 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ 676 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ \
677 || defined __ARM_ARCH_6T2__
637 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory") 678 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory")
638 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \ 679 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \
639 || defined __ARM_ARCH_7M__ || defined __ARM_ARCH_7R__ 680 || defined __ARM_ARCH_7R__ || defined __ARM_ARCH_7M__
640 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory") 681 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory")
641 #elif __aarch64__ 682 #elif __aarch64__
642 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb ish" : : : "memory") 683 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb ish" : : : "memory")
643 #elif (__sparc || __sparc__) && !__sparcv8 684 #elif (__sparc || __sparc__) && !(__sparc_v8__ || defined __sparcv8)
644 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory") 685 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory")
645 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory") 686 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory")
646 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore") 687 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore")
647 #elif defined __s390__ || defined __s390x__ 688 #elif defined __s390__ || defined __s390x__
648 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory") 689 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory")
672 /* see comment below (stdatomic.h) about the C11 memory model. */ 713 /* see comment below (stdatomic.h) about the C11 memory model. */
673 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST) 714 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST)
674 #define ECB_MEMORY_FENCE_ACQUIRE __atomic_thread_fence (__ATOMIC_ACQUIRE) 715 #define ECB_MEMORY_FENCE_ACQUIRE __atomic_thread_fence (__ATOMIC_ACQUIRE)
675 #define ECB_MEMORY_FENCE_RELEASE __atomic_thread_fence (__ATOMIC_RELEASE) 716 #define ECB_MEMORY_FENCE_RELEASE __atomic_thread_fence (__ATOMIC_RELEASE)
676 717
677 /* The __has_feature syntax from clang is so misdesigned that we cannot use it 718 #elif ECB_CLANG_EXTENSION(c_atomic)
678 * without risking compile time errors with other compilers. We *could*
679 * define our own ecb_clang_has_feature, but I just can't be bothered to work
680 * around this shit time and again.
681 * #elif defined __clang && __has_feature (cxx_atomic)
682 * // see comment below (stdatomic.h) about the C11 memory model. 719 /* see comment below (stdatomic.h) about the C11 memory model. */
683 * #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST) 720 #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST)
684 * #define ECB_MEMORY_FENCE_ACQUIRE __c11_atomic_thread_fence (__ATOMIC_ACQUIRE) 721 #define ECB_MEMORY_FENCE_ACQUIRE __c11_atomic_thread_fence (__ATOMIC_ACQUIRE)
685 * #define ECB_MEMORY_FENCE_RELEASE __c11_atomic_thread_fence (__ATOMIC_RELEASE) 722 #define ECB_MEMORY_FENCE_RELEASE __c11_atomic_thread_fence (__ATOMIC_RELEASE)
686 */
687 723
688 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__ 724 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__
689 #define ECB_MEMORY_FENCE __sync_synchronize () 725 #define ECB_MEMORY_FENCE __sync_synchronize ()
690 #elif _MSC_VER >= 1500 /* VC++ 2008 */ 726 #elif _MSC_VER >= 1500 /* VC++ 2008 */
691 /* apparently, microsoft broke all the memory barrier stuff in Visual Studio 2008... */ 727 /* apparently, microsoft broke all the memory barrier stuff in Visual Studio 2008... */
754 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE 790 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE
755#endif 791#endif
756 792
757/*****************************************************************************/ 793/*****************************************************************************/
758 794
759#if __cplusplus 795#if ECB_CPP
760 #define ecb_inline static inline 796 #define ecb_inline static inline
761#elif ECB_GCC_VERSION(2,5) 797#elif ECB_GCC_VERSION(2,5)
762 #define ecb_inline static __inline__ 798 #define ecb_inline static __inline__
763#elif ECB_C99 799#elif ECB_C99
764 #define ecb_inline static inline 800 #define ecb_inline static inline
778 814
779#define ECB_CONCAT_(a, b) a ## b 815#define ECB_CONCAT_(a, b) a ## b
780#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b) 816#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b)
781#define ECB_STRINGIFY_(a) # a 817#define ECB_STRINGIFY_(a) # a
782#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a) 818#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a)
819#define ECB_STRINGIFY_EXPR(expr) ((expr), ECB_STRINGIFY_ (expr))
783 820
784#define ecb_function_ ecb_inline 821#define ecb_function_ ecb_inline
785 822
786#if ECB_GCC_VERSION(3,1) 823#if ECB_GCC_VERSION(3,1) || ECB_CLANG_VERSION(2,8)
787 #define ecb_attribute(attrlist) __attribute__(attrlist) 824 #define ecb_attribute(attrlist) __attribute__ (attrlist)
825#else
826 #define ecb_attribute(attrlist)
827#endif
828
829#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_constant_p)
788 #define ecb_is_constant(expr) __builtin_constant_p (expr) 830 #define ecb_is_constant(expr) __builtin_constant_p (expr)
789 #define ecb_expect(expr,value) __builtin_expect ((expr),(value))
790 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
791#else 831#else
792 #define ecb_attribute(attrlist)
793
794 /* possible C11 impl for integral types 832 /* possible C11 impl for integral types
795 typedef struct ecb_is_constant_struct ecb_is_constant_struct; 833 typedef struct ecb_is_constant_struct ecb_is_constant_struct;
796 #define ecb_is_constant(expr) _Generic ((1 ? (struct ecb_is_constant_struct *)0 : (void *)((expr) - (expr)), ecb_is_constant_struct *: 0, default: 1)) */ 834 #define ecb_is_constant(expr) _Generic ((1 ? (struct ecb_is_constant_struct *)0 : (void *)((expr) - (expr)), ecb_is_constant_struct *: 0, default: 1)) */
797 835
798 #define ecb_is_constant(expr) 0 836 #define ecb_is_constant(expr) 0
837#endif
838
839#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_expect)
840 #define ecb_expect(expr,value) __builtin_expect ((expr),(value))
841#else
799 #define ecb_expect(expr,value) (expr) 842 #define ecb_expect(expr,value) (expr)
843#endif
844
845#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_prefetch)
846 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
847#else
800 #define ecb_prefetch(addr,rw,locality) 848 #define ecb_prefetch(addr,rw,locality)
801#endif 849#endif
802 850
803/* no emulation for ecb_decltype */ 851/* no emulation for ecb_decltype */
804#if ECB_GCC_VERSION(4,5) 852#if ECB_CPP11
853 // older implementations might have problems with decltype(x)::type, work around it
854 template<class T> struct ecb_decltype_t { typedef T type; };
805 #define ecb_decltype(x) __decltype(x) 855 #define ecb_decltype(x) ecb_decltype_t<decltype (x)>::type
806#elif ECB_GCC_VERSION(3,0) 856#elif ECB_GCC_VERSION(3,0) || ECB_CLANG_VERSION(2,8)
807 #define ecb_decltype(x) __typeof(x) 857 #define ecb_decltype(x) __typeof__ (x)
808#endif 858#endif
809 859
810#if _MSC_VER >= 1300 860#if _MSC_VER >= 1300
811 #define ecb_deprecated __declspec(deprecated) 861 #define ecb_deprecated __declspec (deprecated)
812#else 862#else
813 #define ecb_deprecated ecb_attribute ((__deprecated__)) 863 #define ecb_deprecated ecb_attribute ((__deprecated__))
814#endif 864#endif
815 865
866#if _MSC_VER >= 1500
867 #define ecb_deprecated_message(msg) __declspec (deprecated (msg))
868#elif ECB_GCC_VERSION(4,5)
869 #define ecb_deprecated_message(msg) ecb_attribute ((__deprecated__ (msg))
870#else
871 #define ecb_deprecated_message(msg) ecb_deprecated
872#endif
873
874#if _MSC_VER >= 1400
875 #define ecb_noinline __declspec (noinline)
876#else
816#define ecb_noinline ecb_attribute ((__noinline__)) 877 #define ecb_noinline ecb_attribute ((__noinline__))
878#endif
879
817#define ecb_unused ecb_attribute ((__unused__)) 880#define ecb_unused ecb_attribute ((__unused__))
818#define ecb_const ecb_attribute ((__const__)) 881#define ecb_const ecb_attribute ((__const__))
819#define ecb_pure ecb_attribute ((__pure__)) 882#define ecb_pure ecb_attribute ((__pure__))
820 883
821/* http://msdn.microsoft.com/en-us/library/k6ktzx3s.aspx __declspec(noreturn) */ 884#if ECB_C11 || __IBMC_NORETURN
822#if ECB_C11 885 /* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/language_ref/noreturn.html */
823 #define ecb_noreturn _Noreturn 886 #define ecb_noreturn _Noreturn
887#elif ECB_CPP11
888 #define ecb_noreturn [[noreturn]]
889#elif _MSC_VER >= 1200
890 /* http://msdn.microsoft.com/en-us/library/k6ktzx3s.aspx */
891 #define ecb_noreturn __declspec (noreturn)
824#else 892#else
825 #define ecb_noreturn ecb_attribute ((__noreturn__)) 893 #define ecb_noreturn ecb_attribute ((__noreturn__))
826#endif 894#endif
827 895
828#if ECB_GCC_VERSION(4,3) 896#if ECB_GCC_VERSION(4,3)
843/* for compatibility to the rest of the world */ 911/* for compatibility to the rest of the world */
844#define ecb_likely(expr) ecb_expect_true (expr) 912#define ecb_likely(expr) ecb_expect_true (expr)
845#define ecb_unlikely(expr) ecb_expect_false (expr) 913#define ecb_unlikely(expr) ecb_expect_false (expr)
846 914
847/* count trailing zero bits and count # of one bits */ 915/* count trailing zero bits and count # of one bits */
848#if ECB_GCC_VERSION(3,4) 916#if ECB_GCC_VERSION(3,4) \
917 || (ECB_CLANG_BUILTIN(__builtin_clz) && ECB_CLANG_BUILTIN(__builtin_clzll) \
918 && ECB_CLANG_BUILTIN(__builtin_ctz) && ECB_CLANG_BUILTIN(__builtin_ctzll) \
919 && ECB_CLANG_BUILTIN(__builtin_popcount))
849 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */ 920 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */
850 #define ecb_ld32(x) (__builtin_clz (x) ^ 31) 921 #define ecb_ld32(x) (__builtin_clz (x) ^ 31)
851 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63) 922 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63)
852 #define ecb_ctz32(x) __builtin_ctz (x) 923 #define ecb_ctz32(x) __builtin_ctz (x)
853 #define ecb_ctz64(x) __builtin_ctzll (x) 924 #define ecb_ctz64(x) __builtin_ctzll (x)
854 #define ecb_popcount32(x) __builtin_popcount (x) 925 #define ecb_popcount32(x) __builtin_popcount (x)
855 /* no popcountll */ 926 /* no popcountll */
856#else 927#else
857 ecb_function_ int ecb_ctz32 (uint32_t x) ecb_const; 928 ecb_function_ ecb_const int ecb_ctz32 (uint32_t x);
858 ecb_function_ int 929 ecb_function_ ecb_const int
859 ecb_ctz32 (uint32_t x) 930 ecb_ctz32 (uint32_t x)
860 { 931 {
932#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
933 unsigned long r;
934 _BitScanForward (&r, x);
935 return (int)r;
936#else
861 int r = 0; 937 int r = 0;
862 938
863 x &= ~x + 1; /* this isolates the lowest bit */ 939 x &= ~x + 1; /* this isolates the lowest bit */
864 940
865#if ECB_branchless_on_i386 941#if ECB_branchless_on_i386
875 if (x & 0xff00ff00) r += 8; 951 if (x & 0xff00ff00) r += 8;
876 if (x & 0xffff0000) r += 16; 952 if (x & 0xffff0000) r += 16;
877#endif 953#endif
878 954
879 return r; 955 return r;
956#endif
880 } 957 }
881 958
882 ecb_function_ int ecb_ctz64 (uint64_t x) ecb_const; 959 ecb_function_ ecb_const int ecb_ctz64 (uint64_t x);
883 ecb_function_ int 960 ecb_function_ ecb_const int
884 ecb_ctz64 (uint64_t x) 961 ecb_ctz64 (uint64_t x)
885 { 962 {
963#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
964 unsigned long r;
965 _BitScanForward64 (&r, x);
966 return (int)r;
967#else
886 int shift = x & 0xffffffffU ? 0 : 32; 968 int shift = x & 0xffffffff ? 0 : 32;
887 return ecb_ctz32 (x >> shift) + shift; 969 return ecb_ctz32 (x >> shift) + shift;
970#endif
888 } 971 }
889 972
890 ecb_function_ int ecb_popcount32 (uint32_t x) ecb_const; 973 ecb_function_ ecb_const int ecb_popcount32 (uint32_t x);
891 ecb_function_ int 974 ecb_function_ ecb_const int
892 ecb_popcount32 (uint32_t x) 975 ecb_popcount32 (uint32_t x)
893 { 976 {
894 x -= (x >> 1) & 0x55555555; 977 x -= (x >> 1) & 0x55555555;
895 x = ((x >> 2) & 0x33333333) + (x & 0x33333333); 978 x = ((x >> 2) & 0x33333333) + (x & 0x33333333);
896 x = ((x >> 4) + x) & 0x0f0f0f0f; 979 x = ((x >> 4) + x) & 0x0f0f0f0f;
897 x *= 0x01010101; 980 x *= 0x01010101;
898 981
899 return x >> 24; 982 return x >> 24;
900 } 983 }
901 984
902 ecb_function_ int ecb_ld32 (uint32_t x) ecb_const; 985 ecb_function_ ecb_const int ecb_ld32 (uint32_t x);
903 ecb_function_ int ecb_ld32 (uint32_t x) 986 ecb_function_ ecb_const int ecb_ld32 (uint32_t x)
904 { 987 {
988#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
989 unsigned long r;
990 _BitScanReverse (&r, x);
991 return (int)r;
992#else
905 int r = 0; 993 int r = 0;
906 994
907 if (x >> 16) { x >>= 16; r += 16; } 995 if (x >> 16) { x >>= 16; r += 16; }
908 if (x >> 8) { x >>= 8; r += 8; } 996 if (x >> 8) { x >>= 8; r += 8; }
909 if (x >> 4) { x >>= 4; r += 4; } 997 if (x >> 4) { x >>= 4; r += 4; }
910 if (x >> 2) { x >>= 2; r += 2; } 998 if (x >> 2) { x >>= 2; r += 2; }
911 if (x >> 1) { r += 1; } 999 if (x >> 1) { r += 1; }
912 1000
913 return r; 1001 return r;
1002#endif
914 } 1003 }
915 1004
916 ecb_function_ int ecb_ld64 (uint64_t x) ecb_const; 1005 ecb_function_ ecb_const int ecb_ld64 (uint64_t x);
917 ecb_function_ int ecb_ld64 (uint64_t x) 1006 ecb_function_ ecb_const int ecb_ld64 (uint64_t x)
918 { 1007 {
1008#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
1009 unsigned long r;
1010 _BitScanReverse64 (&r, x);
1011 return (int)r;
1012#else
919 int r = 0; 1013 int r = 0;
920 1014
921 if (x >> 32) { x >>= 32; r += 32; } 1015 if (x >> 32) { x >>= 32; r += 32; }
922 1016
923 return r + ecb_ld32 (x); 1017 return r + ecb_ld32 (x);
1018#endif
924 } 1019 }
925#endif 1020#endif
926 1021
927ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) ecb_const; 1022ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x);
928ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); } 1023ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); }
929ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) ecb_const; 1024ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x);
930ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); } 1025ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); }
931 1026
932ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) ecb_const; 1027ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x);
933ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) 1028ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x)
934{ 1029{
935 return ( (x * 0x0802U & 0x22110U) 1030 return ( (x * 0x0802U & 0x22110U)
936 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16; 1031 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16;
937} 1032}
938 1033
939ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) ecb_const; 1034ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x);
940ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) 1035ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x)
941{ 1036{
942 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1); 1037 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1);
943 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2); 1038 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2);
944 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4); 1039 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4);
945 x = ( x >> 8 ) | ( x << 8); 1040 x = ( x >> 8 ) | ( x << 8);
946 1041
947 return x; 1042 return x;
948} 1043}
949 1044
950ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) ecb_const; 1045ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x);
951ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) 1046ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x)
952{ 1047{
953 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1); 1048 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1);
954 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2); 1049 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2);
955 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4); 1050 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4);
956 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8); 1051 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8);
959 return x; 1054 return x;
960} 1055}
961 1056
962/* popcount64 is only available on 64 bit cpus as gcc builtin */ 1057/* popcount64 is only available on 64 bit cpus as gcc builtin */
963/* so for this version we are lazy */ 1058/* so for this version we are lazy */
964ecb_function_ int ecb_popcount64 (uint64_t x) ecb_const; 1059ecb_function_ ecb_const int ecb_popcount64 (uint64_t x);
965ecb_function_ int 1060ecb_function_ ecb_const int
966ecb_popcount64 (uint64_t x) 1061ecb_popcount64 (uint64_t x)
967{ 1062{
968 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32); 1063 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32);
969} 1064}
970 1065
971ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) ecb_const; 1066ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count);
972ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) ecb_const; 1067ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count);
973ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) ecb_const; 1068ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count);
974ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) ecb_const; 1069ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count);
975ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) ecb_const; 1070ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count);
976ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) ecb_const; 1071ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count);
977ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) ecb_const; 1072ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count);
978ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) ecb_const; 1073ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count);
979 1074
980ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); } 1075ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); }
981ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); } 1076ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); }
982ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); } 1077ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); }
983ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); } 1078ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); }
984ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); } 1079ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); }
985ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); } 1080ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); }
986ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); } 1081ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); }
987ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); } 1082ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); }
988 1083
989#if ECB_GCC_VERSION(4,3) 1084#if ECB_GCC_VERSION(4,3) || (ECB_CLANG_BUILTIN(__builtin_bswap32) && ECB_CLANG_BUILTIN(__builtin_bswap64))
1085 #if ECB_GCC_VERSION(4,8) || ECB_CLANG_BUILTIN(__builtin_bswap16)
1086 #define ecb_bswap16(x) __builtin_bswap16 (x)
1087 #else
990 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16) 1088 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16)
1089 #endif
991 #define ecb_bswap32(x) __builtin_bswap32 (x) 1090 #define ecb_bswap32(x) __builtin_bswap32 (x)
992 #define ecb_bswap64(x) __builtin_bswap64 (x) 1091 #define ecb_bswap64(x) __builtin_bswap64 (x)
1092#elif _MSC_VER
1093 #include <stdlib.h>
1094 #define ecb_bswap16(x) ((uint16_t)_byteswap_ushort ((uint16_t)(x)))
1095 #define ecb_bswap32(x) ((uint32_t)_byteswap_ulong ((uint32_t)(x)))
1096 #define ecb_bswap64(x) ((uint64_t)_byteswap_uint64 ((uint64_t)(x)))
993#else 1097#else
994 ecb_function_ uint16_t ecb_bswap16 (uint16_t x) ecb_const; 1098 ecb_function_ ecb_const uint16_t ecb_bswap16 (uint16_t x);
995 ecb_function_ uint16_t 1099 ecb_function_ ecb_const uint16_t
996 ecb_bswap16 (uint16_t x) 1100 ecb_bswap16 (uint16_t x)
997 { 1101 {
998 return ecb_rotl16 (x, 8); 1102 return ecb_rotl16 (x, 8);
999 } 1103 }
1000 1104
1001 ecb_function_ uint32_t ecb_bswap32 (uint32_t x) ecb_const; 1105 ecb_function_ ecb_const uint32_t ecb_bswap32 (uint32_t x);
1002 ecb_function_ uint32_t 1106 ecb_function_ ecb_const uint32_t
1003 ecb_bswap32 (uint32_t x) 1107 ecb_bswap32 (uint32_t x)
1004 { 1108 {
1005 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16); 1109 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16);
1006 } 1110 }
1007 1111
1008 ecb_function_ uint64_t ecb_bswap64 (uint64_t x) ecb_const; 1112 ecb_function_ ecb_const uint64_t ecb_bswap64 (uint64_t x);
1009 ecb_function_ uint64_t 1113 ecb_function_ ecb_const uint64_t
1010 ecb_bswap64 (uint64_t x) 1114 ecb_bswap64 (uint64_t x)
1011 { 1115 {
1012 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32); 1116 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32);
1013 } 1117 }
1014#endif 1118#endif
1015 1119
1016#if ECB_GCC_VERSION(4,5) 1120#if ECB_GCC_VERSION(4,5) || ECB_CLANG_BUILTIN(__builtin_unreachable)
1017 #define ecb_unreachable() __builtin_unreachable () 1121 #define ecb_unreachable() __builtin_unreachable ()
1018#else 1122#else
1019 /* this seems to work fine, but gcc always emits a warning for it :/ */ 1123 /* this seems to work fine, but gcc always emits a warning for it :/ */
1020 ecb_inline void ecb_unreachable (void) ecb_noreturn; 1124 ecb_inline ecb_noreturn void ecb_unreachable (void);
1021 ecb_inline void ecb_unreachable (void) { } 1125 ecb_inline ecb_noreturn void ecb_unreachable (void) { }
1022#endif 1126#endif
1023 1127
1024/* try to tell the compiler that some condition is definitely true */ 1128/* try to tell the compiler that some condition is definitely true */
1025#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0 1129#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0
1026 1130
1027ecb_inline unsigned char ecb_byteorder_helper (void) ecb_const; 1131ecb_inline ecb_const uint32_t ecb_byteorder_helper (void);
1028ecb_inline unsigned char 1132ecb_inline ecb_const uint32_t
1029ecb_byteorder_helper (void) 1133ecb_byteorder_helper (void)
1030{ 1134{
1031 /* the union code still generates code under pressure in gcc, */ 1135 /* the union code still generates code under pressure in gcc, */
1032 /* but less than using pointers, and always seems to */ 1136 /* but less than using pointers, and always seems to */
1033 /* successfully return a constant. */ 1137 /* successfully return a constant. */
1034 /* the reason why we have this horrible preprocessor mess */ 1138 /* the reason why we have this horrible preprocessor mess */
1035 /* is to avoid it in all cases, at least on common architectures */ 1139 /* is to avoid it in all cases, at least on common architectures */
1036 /* or when using a recent enough gcc version (>= 4.6) */ 1140 /* or when using a recent enough gcc version (>= 4.6) */
1037#if __i386 || __i386__ || _M_X86 || __amd64 || __amd64__ || _M_X64
1038 return 0x44;
1039#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__ 1141#if (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__) \
1142 || ((__i386 || __i386__ || _M_IX86 || ECB_GCC_AMD64 || ECB_MSVC_AMD64) && !__VOS__)
1143 #define ECB_LITTLE_ENDIAN 1
1040 return 0x44; 1144 return 0x44332211;
1041#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__ 1145#elif (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__) \
1146 || ((__AARCH64EB__ || __MIPSEB__ || __ARMEB__) && !__VOS__)
1147 #define ECB_BIG_ENDIAN 1
1042 return 0x11; 1148 return 0x11223344;
1043#else 1149#else
1044 union 1150 union
1045 { 1151 {
1152 uint8_t c[4];
1046 uint32_t i; 1153 uint32_t u;
1047 uint8_t c;
1048 } u = { 0x11223344 }; 1154 } u = { 0x11, 0x22, 0x33, 0x44 };
1049 return u.c; 1155 return u.u;
1050#endif 1156#endif
1051} 1157}
1052 1158
1053ecb_inline ecb_bool ecb_big_endian (void) ecb_const; 1159ecb_inline ecb_const ecb_bool ecb_big_endian (void);
1054ecb_inline ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11; } 1160ecb_inline ecb_const ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11223344; }
1055ecb_inline ecb_bool ecb_little_endian (void) ecb_const; 1161ecb_inline ecb_const ecb_bool ecb_little_endian (void);
1056ecb_inline ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44; } 1162ecb_inline ecb_const ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44332211; }
1057 1163
1058#if ECB_GCC_VERSION(3,0) || ECB_C99 1164#if ECB_GCC_VERSION(3,0) || ECB_C99
1059 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0)) 1165 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0))
1060#else 1166#else
1061 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n))) 1167 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n)))
1062#endif 1168#endif
1063 1169
1064#if __cplusplus 1170#if ECB_CPP
1065 template<typename T> 1171 template<typename T>
1066 static inline T ecb_div_rd (T val, T div) 1172 static inline T ecb_div_rd (T val, T div)
1067 { 1173 {
1068 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div; 1174 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div;
1069 } 1175 }
1086 } 1192 }
1087#else 1193#else
1088 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0])) 1194 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0]))
1089#endif 1195#endif
1090 1196
1197ecb_function_ ecb_const uint32_t ecb_binary16_to_binary32 (uint32_t x);
1198ecb_function_ ecb_const uint32_t
1199ecb_binary16_to_binary32 (uint32_t x)
1200{
1201 unsigned int s = (x & 0x8000) << (31 - 15);
1202 int e = (x >> 10) & 0x001f;
1203 unsigned int m = x & 0x03ff;
1204
1205 if (ecb_expect_false (e == 31))
1206 /* infinity or NaN */
1207 e = 255 - (127 - 15);
1208 else if (ecb_expect_false (!e))
1209 {
1210 if (ecb_expect_true (!m))
1211 /* zero, handled by code below by forcing e to 0 */
1212 e = 0 - (127 - 15);
1213 else
1214 {
1215 /* subnormal, renormalise */
1216 unsigned int s = 10 - ecb_ld32 (m);
1217
1218 m = (m << s) & 0x3ff; /* mask implicit bit */
1219 e -= s - 1;
1220 }
1221 }
1222
1223 /* e and m now are normalised, or zero, (or inf or nan) */
1224 e += 127 - 15;
1225
1226 return s | (e << 23) | (m << (23 - 10));
1227}
1228
1229ecb_function_ ecb_const uint16_t ecb_binary32_to_binary16 (uint32_t x);
1230ecb_function_ ecb_const uint16_t
1231ecb_binary32_to_binary16 (uint32_t x)
1232{
1233 unsigned int s = (x >> 16) & 0x00008000; /* sign bit, the easy part */
1234 unsigned int e = ((x >> 23) & 0x000000ff) - (127 - 15); /* the desired exponent */
1235 unsigned int m = x & 0x007fffff;
1236
1237 x &= 0x7fffffff;
1238
1239 /* if it's within range of binary16 normals, use fast path */
1240 if (ecb_expect_true (0x38800000 <= x && x <= 0x477fefff))
1241 {
1242 /* mantissa round-to-even */
1243 m += 0x00000fff + ((m >> (23 - 10)) & 1);
1244
1245 /* handle overflow */
1246 if (ecb_expect_false (m >= 0x00800000))
1247 {
1248 m >>= 1;
1249 e += 1;
1250 }
1251
1252 return s | (e << 10) | (m >> (23 - 10));
1253 }
1254
1255 /* handle large numbers and infinity */
1256 if (ecb_expect_true (0x477fefff < x && x <= 0x7f800000))
1257 return s | 0x7c00;
1258
1259 /* handle zero, subnormals and small numbers */
1260 if (ecb_expect_true (x < 0x38800000))
1261 {
1262 /* zero */
1263 if (ecb_expect_true (!x))
1264 return s;
1265
1266 /* handle subnormals */
1267
1268 /* too small, will be zero */
1269 if (e < (14 - 24)) /* might not be sharp, but is good enough */
1270 return s;
1271
1272 m |= 0x00800000; /* make implicit bit explicit */
1273
1274 /* very tricky - we need to round to the nearest e (+10) bit value */
1275 {
1276 unsigned int bits = 14 - e;
1277 unsigned int half = (1 << (bits - 1)) - 1;
1278 unsigned int even = (m >> bits) & 1;
1279
1280 /* if this overflows, we will end up with a normalised number */
1281 m = (m + half + even) >> bits;
1282 }
1283
1284 return s | m;
1285 }
1286
1287 /* handle NaNs, preserve leftmost nan bits, but make sure we don't turn them into infinities */
1288 m >>= 13;
1289
1290 return s | 0x7c00 | m | !m;
1291}
1292
1091/*******************************************************************************/ 1293/*******************************************************************************/
1092/* floating point stuff, can be disabled by defining ECB_NO_LIBM */ 1294/* floating point stuff, can be disabled by defining ECB_NO_LIBM */
1093 1295
1094/* basically, everything uses "ieee pure-endian" floating point numbers */ 1296/* basically, everything uses "ieee pure-endian" floating point numbers */
1095/* the only noteworthy exception is ancient armle, which uses order 43218765 */ 1297/* the only noteworthy exception is ancient armle, which uses order 43218765 */
1096#if 0 \ 1298#if 0 \
1097 || __i386 || __i386__ \ 1299 || __i386 || __i386__ \
1098 || __amd64 || __amd64__ || __x86_64 || __x86_64__ \ 1300 || ECB_GCC_AMD64 \
1099 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \ 1301 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \
1100 || defined __s390__ || defined __s390x__ \ 1302 || defined __s390__ || defined __s390x__ \
1101 || defined __mips__ \ 1303 || defined __mips__ \
1102 || defined __alpha__ \ 1304 || defined __alpha__ \
1103 || defined __hppa__ \ 1305 || defined __hppa__ \
1104 || defined __ia64__ \ 1306 || defined __ia64__ \
1105 || defined __m68k__ \ 1307 || defined __m68k__ \
1106 || defined __m88k__ \ 1308 || defined __m88k__ \
1107 || defined __sh__ \ 1309 || defined __sh__ \
1108 || defined _M_IX86 || defined _M_AMD64 || defined _M_IA64 \ 1310 || defined _M_IX86 || defined ECB_MSVC_AMD64 || defined _M_IA64 \
1109 || (defined __arm__ && (defined __ARM_EABI__ || defined __EABI__ || defined __VFP_FP__ || defined _WIN32_WCE || defined __ANDROID__)) \ 1311 || (defined __arm__ && (defined __ARM_EABI__ || defined __EABI__ || defined __VFP_FP__ || defined _WIN32_WCE || defined __ANDROID__)) \
1110 || defined __aarch64__ 1312 || defined __aarch64__
1111 #define ECB_STDFP 1 1313 #define ECB_STDFP 1
1112 #include <string.h> /* for memcpy */ 1314 #include <string.h> /* for memcpy */
1113#else 1315#else
1129 #define ECB_NAN NAN 1331 #define ECB_NAN NAN
1130 #else 1332 #else
1131 #define ECB_NAN ECB_INFINITY 1333 #define ECB_NAN ECB_INFINITY
1132 #endif 1334 #endif
1133 1335
1134 /* converts an ieee half/binary16 to a float */ 1336 #if ECB_C99 || _XOPEN_VERSION >= 600 || _POSIX_VERSION >= 200112L
1135 ecb_function_ float ecb_binary16_to_float (uint16_t x) ecb_const; 1337 #define ecb_ldexpf(x,e) ldexpf ((x), (e))
1136 ecb_function_ float 1338 #define ecb_frexpf(x,e) frexpf ((x), (e))
1137 ecb_binary16_to_float (uint16_t x) 1339 #else
1138 { 1340 #define ecb_ldexpf(x,e) (float) ldexp ((double) (x), (e))
1139 int e = (x >> 10) & 0x1f; 1341 #define ecb_frexpf(x,e) (float) frexp ((double) (x), (e))
1140 int m = x & 0x3ff; 1342 #endif
1141 float r;
1142
1143 if (!e ) r = ldexpf (m , -24);
1144 else if (e != 31) r = ldexpf (m + 0x400, e - 25);
1145 else if (m ) r = ECB_NAN;
1146 else r = ECB_INFINITY;
1147
1148 return x & 0x8000 ? -r : r;
1149 }
1150 1343
1151 /* convert a float to ieee single/binary32 */ 1344 /* convert a float to ieee single/binary32 */
1152 ecb_function_ uint32_t ecb_float_to_binary32 (float x) ecb_const; 1345 ecb_function_ ecb_const uint32_t ecb_float_to_binary32 (float x);
1153 ecb_function_ uint32_t 1346 ecb_function_ ecb_const uint32_t
1154 ecb_float_to_binary32 (float x) 1347 ecb_float_to_binary32 (float x)
1155 { 1348 {
1156 uint32_t r; 1349 uint32_t r;
1157 1350
1158 #if ECB_STDFP 1351 #if ECB_STDFP
1165 if (x == 0e0f ) return 0x00000000U; 1358 if (x == 0e0f ) return 0x00000000U;
1166 if (x > +3.40282346638528860e+38f) return 0x7f800000U; 1359 if (x > +3.40282346638528860e+38f) return 0x7f800000U;
1167 if (x < -3.40282346638528860e+38f) return 0xff800000U; 1360 if (x < -3.40282346638528860e+38f) return 0xff800000U;
1168 if (x != x ) return 0x7fbfffffU; 1361 if (x != x ) return 0x7fbfffffU;
1169 1362
1170 m = frexpf (x, &e) * 0x1000000U; 1363 m = ecb_frexpf (x, &e) * 0x1000000U;
1171 1364
1172 r = m & 0x80000000U; 1365 r = m & 0x80000000U;
1173 1366
1174 if (r) 1367 if (r)
1175 m = -m; 1368 m = -m;
1187 1380
1188 return r; 1381 return r;
1189 } 1382 }
1190 1383
1191 /* converts an ieee single/binary32 to a float */ 1384 /* converts an ieee single/binary32 to a float */
1192 ecb_function_ float ecb_binary32_to_float (uint32_t x) ecb_const; 1385 ecb_function_ ecb_const float ecb_binary32_to_float (uint32_t x);
1193 ecb_function_ float 1386 ecb_function_ ecb_const float
1194 ecb_binary32_to_float (uint32_t x) 1387 ecb_binary32_to_float (uint32_t x)
1195 { 1388 {
1196 float r; 1389 float r;
1197 1390
1198 #if ECB_STDFP 1391 #if ECB_STDFP
1208 x |= 0x800000U; 1401 x |= 0x800000U;
1209 else 1402 else
1210 e = 1; 1403 e = 1;
1211 1404
1212 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */ 1405 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */
1213 r = ldexpf (x * (0.5f / 0x800000U), e - 126); 1406 r = ecb_ldexpf (x * (0.5f / 0x800000U), e - 126);
1214 1407
1215 r = neg ? -r : r; 1408 r = neg ? -r : r;
1216 #endif 1409 #endif
1217 1410
1218 return r; 1411 return r;
1219 } 1412 }
1220 1413
1221 /* convert a double to ieee double/binary64 */ 1414 /* convert a double to ieee double/binary64 */
1222 ecb_function_ uint64_t ecb_double_to_binary64 (double x) ecb_const; 1415 ecb_function_ ecb_const uint64_t ecb_double_to_binary64 (double x);
1223 ecb_function_ uint64_t 1416 ecb_function_ ecb_const uint64_t
1224 ecb_double_to_binary64 (double x) 1417 ecb_double_to_binary64 (double x)
1225 { 1418 {
1226 uint64_t r; 1419 uint64_t r;
1227 1420
1228 #if ECB_STDFP 1421 #if ECB_STDFP
1257 1450
1258 return r; 1451 return r;
1259 } 1452 }
1260 1453
1261 /* converts an ieee double/binary64 to a double */ 1454 /* converts an ieee double/binary64 to a double */
1262 ecb_function_ double ecb_binary64_to_double (uint64_t x) ecb_const; 1455 ecb_function_ ecb_const double ecb_binary64_to_double (uint64_t x);
1263 ecb_function_ double 1456 ecb_function_ ecb_const double
1264 ecb_binary64_to_double (uint64_t x) 1457 ecb_binary64_to_double (uint64_t x)
1265 { 1458 {
1266 double r; 1459 double r;
1267 1460
1268 #if ECB_STDFP 1461 #if ECB_STDFP
1284 1477
1285 r = neg ? -r : r; 1478 r = neg ? -r : r;
1286 #endif 1479 #endif
1287 1480
1288 return r; 1481 return r;
1482 }
1483
1484 /* convert a float to ieee half/binary16 */
1485 ecb_function_ ecb_const uint16_t ecb_float_to_binary16 (float x);
1486 ecb_function_ ecb_const uint16_t
1487 ecb_float_to_binary16 (float x)
1488 {
1489 return ecb_binary32_to_binary16 (ecb_float_to_binary32 (x));
1490 }
1491
1492 /* convert an ieee half/binary16 to float */
1493 ecb_function_ ecb_const float ecb_binary16_to_float (uint16_t x);
1494 ecb_function_ ecb_const float
1495 ecb_binary16_to_float (uint16_t x)
1496 {
1497 return ecb_binary32_to_float (ecb_binary16_to_binary32 (x));
1289 } 1498 }
1290 1499
1291#endif 1500#endif
1292 1501
1293#endif 1502#endif
2604{ 2813{
2605 invoke_cb = invoke_pending_cb; 2814 invoke_cb = invoke_pending_cb;
2606} 2815}
2607 2816
2608void 2817void
2609ev_set_loop_release_cb (EV_P_ ev_loop_callback_nothrow release, ev_loop_callback_nothrow acquire) EV_THROW 2818ev_set_loop_release_cb (EV_P_ void (*release)(EV_P) EV_THROW, void (*acquire)(EV_P) EV_THROW) EV_THROW
2610{ 2819{
2611 release_cb = release; 2820 release_cb = release;
2612 acquire_cb = acquire; 2821 acquire_cb = acquire;
2613} 2822}
2614#endif 2823#endif
2840#if EV_USE_INOTIFY 3049#if EV_USE_INOTIFY
2841 infy_fork (EV_A); 3050 infy_fork (EV_A);
2842#endif 3051#endif
2843 3052
2844#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE 3053#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE
2845 if (ev_is_active (&pipe_w)) 3054 if (ev_is_active (&pipe_w) && postfork != 2)
2846 { 3055 {
2847 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */ 3056 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */
2848 3057
2849 ev_ref (EV_A); 3058 ev_ref (EV_A);
2850 ev_io_stop (EV_A_ &pipe_w); 3059 ev_io_stop (EV_A_ &pipe_w);

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines