ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/libev/ev.c
(Generate patch)

Comparing libev/ev.c (file contents):
Revision 1.456 by root, Thu Jul 4 22:32:23 2013 UTC vs.
Revision 1.479 by root, Sun Dec 20 01:31:17 2015 UTC

1/* 1/*
2 * libev event processing core, watcher management 2 * libev event processing core, watcher management
3 * 3 *
4 * Copyright (c) 2007,2008,2009,2010,2011,2012 Marc Alexander Lehmann <libev@schmorp.de> 4 * Copyright (c) 2007,2008,2009,2010,2011,2012,2013 Marc Alexander Lehmann <libev@schmorp.de>
5 * All rights reserved. 5 * All rights reserved.
6 * 6 *
7 * Redistribution and use in source and binary forms, with or without modifica- 7 * Redistribution and use in source and binary forms, with or without modifica-
8 * tion, are permitted provided that the following conditions are met: 8 * tion, are permitted provided that the following conditions are met:
9 * 9 *
43# include EV_CONFIG_H 43# include EV_CONFIG_H
44# else 44# else
45# include "config.h" 45# include "config.h"
46# endif 46# endif
47 47
48#if HAVE_FLOOR 48# if HAVE_FLOOR
49# ifndef EV_USE_FLOOR 49# ifndef EV_USE_FLOOR
50# define EV_USE_FLOOR 1 50# define EV_USE_FLOOR 1
51# endif
51# endif 52# endif
52#endif
53 53
54# if HAVE_CLOCK_SYSCALL 54# if HAVE_CLOCK_SYSCALL
55# ifndef EV_USE_CLOCK_SYSCALL 55# ifndef EV_USE_CLOCK_SYSCALL
56# define EV_USE_CLOCK_SYSCALL 1 56# define EV_USE_CLOCK_SYSCALL 1
57# ifndef EV_USE_REALTIME 57# ifndef EV_USE_REALTIME
241#elif defined SIGARRAYSIZE 241#elif defined SIGARRAYSIZE
242# define EV_NSIG (SIGARRAYSIZE) /* Assume ary[SIGARRAYSIZE] */ 242# define EV_NSIG (SIGARRAYSIZE) /* Assume ary[SIGARRAYSIZE] */
243#elif defined _sys_nsig 243#elif defined _sys_nsig
244# define EV_NSIG (_sys_nsig) /* Solaris 2.5 */ 244# define EV_NSIG (_sys_nsig) /* Solaris 2.5 */
245#else 245#else
246# error "unable to find value for NSIG, please report" 246# define EV_NSIG (8 * sizeof (sigset_t) + 1)
247/* to make it compile regardless, just remove the above line, */
248/* but consider reporting it, too! :) */
249# define EV_NSIG 65
250#endif 247#endif
251 248
252#ifndef EV_USE_FLOOR 249#ifndef EV_USE_FLOOR
253# define EV_USE_FLOOR 0 250# define EV_USE_FLOOR 0
254#endif 251#endif
255 252
256#ifndef EV_USE_CLOCK_SYSCALL 253#ifndef EV_USE_CLOCK_SYSCALL
257# if __linux && __GLIBC__ >= 2 254# if __linux && __GLIBC__ == 2 && __GLIBC_MINOR__ < 17
258# define EV_USE_CLOCK_SYSCALL EV_FEATURE_OS 255# define EV_USE_CLOCK_SYSCALL EV_FEATURE_OS
259# else 256# else
260# define EV_USE_CLOCK_SYSCALL 0 257# define EV_USE_CLOCK_SYSCALL 0
258# endif
259#endif
260
261#if !(_POSIX_TIMERS > 0)
262# ifndef EV_USE_MONOTONIC
263# define EV_USE_MONOTONIC 0
264# endif
265# ifndef EV_USE_REALTIME
266# define EV_USE_REALTIME 0
261# endif 267# endif
262#endif 268#endif
263 269
264#ifndef EV_USE_MONOTONIC 270#ifndef EV_USE_MONOTONIC
265# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0 271# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0
485/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */ 491/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */
486/* ECB.H BEGIN */ 492/* ECB.H BEGIN */
487/* 493/*
488 * libecb - http://software.schmorp.de/pkg/libecb 494 * libecb - http://software.schmorp.de/pkg/libecb
489 * 495 *
490 * Copyright (©) 2009-2012 Marc Alexander Lehmann <libecb@schmorp.de> 496 * Copyright (©) 2009-2015 Marc Alexander Lehmann <libecb@schmorp.de>
491 * Copyright (©) 2011 Emanuele Giaquinta 497 * Copyright (©) 2011 Emanuele Giaquinta
492 * All rights reserved. 498 * All rights reserved.
493 * 499 *
494 * Redistribution and use in source and binary forms, with or without modifica- 500 * Redistribution and use in source and binary forms, with or without modifica-
495 * tion, are permitted provided that the following conditions are met: 501 * tion, are permitted provided that the following conditions are met:
509 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; 515 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
510 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, 516 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
511 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH- 517 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH-
512 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED 518 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
513 * OF THE POSSIBILITY OF SUCH DAMAGE. 519 * OF THE POSSIBILITY OF SUCH DAMAGE.
520 *
521 * Alternatively, the contents of this file may be used under the terms of
522 * the GNU General Public License ("GPL") version 2 or any later version,
523 * in which case the provisions of the GPL are applicable instead of
524 * the above. If you wish to allow the use of your version of this file
525 * only under the terms of the GPL and not to allow others to use your
526 * version of this file under the BSD license, indicate your decision
527 * by deleting the provisions above and replace them with the notice
528 * and other provisions required by the GPL. If you do not delete the
529 * provisions above, a recipient may use your version of this file under
530 * either the BSD or the GPL.
514 */ 531 */
515 532
516#ifndef ECB_H 533#ifndef ECB_H
517#define ECB_H 534#define ECB_H
518 535
519/* 16 bits major, 16 bits minor */ 536/* 16 bits major, 16 bits minor */
520#define ECB_VERSION 0x00010003 537#define ECB_VERSION 0x00010005
521 538
522#ifdef _WIN32 539#ifdef _WIN32
523 typedef signed char int8_t; 540 typedef signed char int8_t;
524 typedef unsigned char uint8_t; 541 typedef unsigned char uint8_t;
525 typedef signed short int16_t; 542 typedef signed short int16_t;
542 typedef uint32_t uintptr_t; 559 typedef uint32_t uintptr_t;
543 typedef int32_t intptr_t; 560 typedef int32_t intptr_t;
544 #endif 561 #endif
545#else 562#else
546 #include <inttypes.h> 563 #include <inttypes.h>
547 #if UINTMAX_MAX > 0xffffffffU 564 #if (defined INTPTR_MAX ? INTPTR_MAX : ULONG_MAX) > 0xffffffffU
548 #define ECB_PTRSIZE 8 565 #define ECB_PTRSIZE 8
549 #else 566 #else
550 #define ECB_PTRSIZE 4 567 #define ECB_PTRSIZE 4
551 #endif 568 #endif
552#endif 569#endif
553 570
571#define ECB_GCC_AMD64 (__amd64 || __amd64__ || __x86_64 || __x86_64__)
572#define ECB_MSVC_AMD64 (_M_AMD64 || _M_X64)
573
554/* work around x32 idiocy by defining proper macros */ 574/* work around x32 idiocy by defining proper macros */
555#if __x86_64 || _M_AMD64 575#if ECB_GCC_AMD64 || ECB_MSVC_AMD64
556 #if __ILP32 576 #if _ILP32
557 #define ECB_AMD64_X32 1 577 #define ECB_AMD64_X32 1
558 #else 578 #else
559 #define ECB_AMD64 1 579 #define ECB_AMD64 1
560 #endif 580 #endif
561#endif 581#endif
565 * causing enormous grief in return for some better fake benchmark numbers. 585 * causing enormous grief in return for some better fake benchmark numbers.
566 * or so. 586 * or so.
567 * we try to detect these and simply assume they are not gcc - if they have 587 * we try to detect these and simply assume they are not gcc - if they have
568 * an issue with that they should have done it right in the first place. 588 * an issue with that they should have done it right in the first place.
569 */ 589 */
570#ifndef ECB_GCC_VERSION
571 #if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__ 590#if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__
572 #define ECB_GCC_VERSION(major,minor) 0 591 #define ECB_GCC_VERSION(major,minor) 0
573 #else 592#else
574 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor))) 593 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor)))
575 #endif 594#endif
576#endif
577 595
578#define ECB_C (__STDC__+0) /* this assumes that __STDC__ is either empty or a number */ 596#define ECB_CLANG_VERSION(major,minor) (__clang_major__ > (major) || (__clang_major__ == (major) && __clang_minor__ >= (minor)))
579#define ECB_C99 (__STDC_VERSION__ >= 199901L) 597
580#define ECB_C11 (__STDC_VERSION__ >= 201112L) 598#if __clang__ && defined __has_builtin
599 #define ECB_CLANG_BUILTIN(x) __has_builtin (x)
600#else
601 #define ECB_CLANG_BUILTIN(x) 0
602#endif
603
604#if __clang__ && defined __has_extension
605 #define ECB_CLANG_EXTENSION(x) __has_extension (x)
606#else
607 #define ECB_CLANG_EXTENSION(x) 0
608#endif
609
581#define ECB_CPP (__cplusplus+0) 610#define ECB_CPP (__cplusplus+0)
582#define ECB_CPP11 (__cplusplus >= 201103L) 611#define ECB_CPP11 (__cplusplus >= 201103L)
612
613#if ECB_CPP
614 #define ECB_C 0
615 #define ECB_STDC_VERSION 0
616#else
617 #define ECB_C 1
618 #define ECB_STDC_VERSION __STDC_VERSION__
619#endif
620
621#define ECB_C99 (ECB_STDC_VERSION >= 199901L)
622#define ECB_C11 (ECB_STDC_VERSION >= 201112L)
583 623
584#if ECB_CPP 624#if ECB_CPP
585 #define ECB_EXTERN_C extern "C" 625 #define ECB_EXTERN_C extern "C"
586 #define ECB_EXTERN_C_BEG ECB_EXTERN_C { 626 #define ECB_EXTERN_C_BEG ECB_EXTERN_C {
587 #define ECB_EXTERN_C_END } 627 #define ECB_EXTERN_C_END }
600 #define ECB_NO_SMP 1 640 #define ECB_NO_SMP 1
601#endif 641#endif
602 642
603#if ECB_NO_SMP 643#if ECB_NO_SMP
604 #define ECB_MEMORY_FENCE do { } while (0) 644 #define ECB_MEMORY_FENCE do { } while (0)
645#endif
646
647/* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/compiler_ref/compiler_builtins.html */
648#if __xlC__ && ECB_CPP
649 #include <builtins.h>
650#endif
651
652#if 1400 <= _MSC_VER
653 #include <intrin.h> /* fence functions _ReadBarrier, also bit search functions _BitScanReverse */
605#endif 654#endif
606 655
607#ifndef ECB_MEMORY_FENCE 656#ifndef ECB_MEMORY_FENCE
608 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110 657 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110
609 #if __i386 || __i386__ 658 #if __i386 || __i386__
610 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory") 659 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory")
611 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 660 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
612 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 661 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
613 #elif __amd64 || __amd64__ || __x86_64 || __x86_64__ 662 #elif ECB_GCC_AMD64
614 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory") 663 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory")
615 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 664 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
616 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 665 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
617 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ 666 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__
618 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory") 667 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory")
668 #elif defined __ARM_ARCH_2__ \
669 || defined __ARM_ARCH_3__ || defined __ARM_ARCH_3M__ \
670 || defined __ARM_ARCH_4__ || defined __ARM_ARCH_4T__ \
671 || defined __ARM_ARCH_5__ || defined __ARM_ARCH_5E__ \
672 || defined __ARM_ARCH_5T__ || defined __ARM_ARCH_5TE__ \
673 || defined __ARM_ARCH_5TEJ__
674 /* should not need any, unless running old code on newer cpu - arm doesn't support that */
619 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \ 675 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \
620 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ 676 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ \
677 || defined __ARM_ARCH_6T2__
621 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory") 678 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory")
622 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \ 679 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \
623 || defined __ARM_ARCH_7M__ || defined __ARM_ARCH_7R__ 680 || defined __ARM_ARCH_7R__ || defined __ARM_ARCH_7M__
624 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory") 681 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory")
625 #elif __sparc || __sparc__ 682 #elif __aarch64__
683 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb ish" : : : "memory")
684 #elif (__sparc || __sparc__) && !(__sparc_v8__ || defined __sparcv8)
626 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory") 685 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory")
627 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory") 686 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory")
628 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore") 687 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore")
629 #elif defined __s390__ || defined __s390x__ 688 #elif defined __s390__ || defined __s390x__
630 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory") 689 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory")
631 #elif defined __mips__ 690 #elif defined __mips__
632 /* GNU/Linux emulates sync on mips1 architectures, so we force it's use */ 691 /* GNU/Linux emulates sync on mips1 architectures, so we force its use */
633 /* anybody else who still uses mips1 is supposed to send in their version, with detection code. */ 692 /* anybody else who still uses mips1 is supposed to send in their version, with detection code. */
634 #define ECB_MEMORY_FENCE __asm__ __volatile__ (".set mips2; sync; .set mips0" : : : "memory") 693 #define ECB_MEMORY_FENCE __asm__ __volatile__ (".set mips2; sync; .set mips0" : : : "memory")
635 #elif defined __alpha__ 694 #elif defined __alpha__
636 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mb" : : : "memory") 695 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mb" : : : "memory")
637 #elif defined __hppa__ 696 #elif defined __hppa__
638 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory") 697 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
639 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 698 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
640 #elif defined __ia64__ 699 #elif defined __ia64__
641 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mf" : : : "memory") 700 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mf" : : : "memory")
701 #elif defined __m68k__
702 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
703 #elif defined __m88k__
704 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("tb1 0,%%r0,128" : : : "memory")
705 #elif defined __sh__
706 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
642 #endif 707 #endif
643 #endif 708 #endif
644#endif 709#endif
645 710
646#ifndef ECB_MEMORY_FENCE 711#ifndef ECB_MEMORY_FENCE
647 #if ECB_GCC_VERSION(4,7) 712 #if ECB_GCC_VERSION(4,7)
648 /* see comment below (stdatomic.h) about the C11 memory model. */ 713 /* see comment below (stdatomic.h) about the C11 memory model. */
649 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST) 714 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST)
715 #define ECB_MEMORY_FENCE_ACQUIRE __atomic_thread_fence (__ATOMIC_ACQUIRE)
716 #define ECB_MEMORY_FENCE_RELEASE __atomic_thread_fence (__ATOMIC_RELEASE)
650 717
651 /* The __has_feature syntax from clang is so misdesigned that we cannot use it 718 #elif ECB_CLANG_EXTENSION(c_atomic)
652 * without risking compile time errors with other compilers. We *could*
653 * define our own ecb_clang_has_feature, but I just can't be bothered to work
654 * around this shit time and again.
655 * #elif defined __clang && __has_feature (cxx_atomic)
656 * // see comment below (stdatomic.h) about the C11 memory model. 719 /* see comment below (stdatomic.h) about the C11 memory model. */
657 * #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST) 720 #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST)
658 */ 721 #define ECB_MEMORY_FENCE_ACQUIRE __c11_atomic_thread_fence (__ATOMIC_ACQUIRE)
722 #define ECB_MEMORY_FENCE_RELEASE __c11_atomic_thread_fence (__ATOMIC_RELEASE)
659 723
660 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__ 724 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__
661 #define ECB_MEMORY_FENCE __sync_synchronize () 725 #define ECB_MEMORY_FENCE __sync_synchronize ()
726 #elif _MSC_VER >= 1500 /* VC++ 2008 */
727 /* apparently, microsoft broke all the memory barrier stuff in Visual Studio 2008... */
728 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier)
729 #define ECB_MEMORY_FENCE _ReadWriteBarrier (); MemoryBarrier()
730 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier (); MemoryBarrier() /* according to msdn, _ReadBarrier is not a load fence */
731 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier (); MemoryBarrier()
662 #elif _MSC_VER >= 1400 /* VC++ 2005 */ 732 #elif _MSC_VER >= 1400 /* VC++ 2005 */
663 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier) 733 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier)
664 #define ECB_MEMORY_FENCE _ReadWriteBarrier () 734 #define ECB_MEMORY_FENCE _ReadWriteBarrier ()
665 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier () /* according to msdn, _ReadBarrier is not a load fence */ 735 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier () /* according to msdn, _ReadBarrier is not a load fence */
666 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier () 736 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier ()
686 /* any fence other than seq_cst, which isn't very efficient for us. */ 756 /* any fence other than seq_cst, which isn't very efficient for us. */
687 /* Why that is, we don't know - either the C11 memory model is quite useless */ 757 /* Why that is, we don't know - either the C11 memory model is quite useless */
688 /* for most usages, or gcc and clang have a bug */ 758 /* for most usages, or gcc and clang have a bug */
689 /* I *currently* lean towards the latter, and inefficiently implement */ 759 /* I *currently* lean towards the latter, and inefficiently implement */
690 /* all three of ecb's fences as a seq_cst fence */ 760 /* all three of ecb's fences as a seq_cst fence */
761 /* Update, gcc-4.8 generates mfence for all c++ fences, but nothing */
762 /* for all __atomic_thread_fence's except seq_cst */
691 #define ECB_MEMORY_FENCE atomic_thread_fence (memory_order_seq_cst) 763 #define ECB_MEMORY_FENCE atomic_thread_fence (memory_order_seq_cst)
692 #endif 764 #endif
693#endif 765#endif
694 766
695#ifndef ECB_MEMORY_FENCE 767#ifndef ECB_MEMORY_FENCE
718 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE 790 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE
719#endif 791#endif
720 792
721/*****************************************************************************/ 793/*****************************************************************************/
722 794
723#if __cplusplus 795#if ECB_CPP
724 #define ecb_inline static inline 796 #define ecb_inline static inline
725#elif ECB_GCC_VERSION(2,5) 797#elif ECB_GCC_VERSION(2,5)
726 #define ecb_inline static __inline__ 798 #define ecb_inline static __inline__
727#elif ECB_C99 799#elif ECB_C99
728 #define ecb_inline static inline 800 #define ecb_inline static inline
742 814
743#define ECB_CONCAT_(a, b) a ## b 815#define ECB_CONCAT_(a, b) a ## b
744#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b) 816#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b)
745#define ECB_STRINGIFY_(a) # a 817#define ECB_STRINGIFY_(a) # a
746#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a) 818#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a)
819#define ECB_STRINGIFY_EXPR(expr) ((expr), ECB_STRINGIFY_ (expr))
747 820
748#define ecb_function_ ecb_inline 821#define ecb_function_ ecb_inline
749 822
750#if ECB_GCC_VERSION(3,1) 823#if ECB_GCC_VERSION(3,1) || ECB_CLANG_VERSION(2,8)
751 #define ecb_attribute(attrlist) __attribute__(attrlist) 824 #define ecb_attribute(attrlist) __attribute__ (attrlist)
825#else
826 #define ecb_attribute(attrlist)
827#endif
828
829#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_constant_p)
752 #define ecb_is_constant(expr) __builtin_constant_p (expr) 830 #define ecb_is_constant(expr) __builtin_constant_p (expr)
831#else
832 /* possible C11 impl for integral types
833 typedef struct ecb_is_constant_struct ecb_is_constant_struct;
834 #define ecb_is_constant(expr) _Generic ((1 ? (struct ecb_is_constant_struct *)0 : (void *)((expr) - (expr)), ecb_is_constant_struct *: 0, default: 1)) */
835
836 #define ecb_is_constant(expr) 0
837#endif
838
839#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_expect)
753 #define ecb_expect(expr,value) __builtin_expect ((expr),(value)) 840 #define ecb_expect(expr,value) __builtin_expect ((expr),(value))
841#else
842 #define ecb_expect(expr,value) (expr)
843#endif
844
845#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_prefetch)
754 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality) 846 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
755#else 847#else
756 #define ecb_attribute(attrlist)
757 #define ecb_is_constant(expr) 0
758 #define ecb_expect(expr,value) (expr)
759 #define ecb_prefetch(addr,rw,locality) 848 #define ecb_prefetch(addr,rw,locality)
760#endif 849#endif
761 850
762/* no emulation for ecb_decltype */ 851/* no emulation for ecb_decltype */
763#if ECB_GCC_VERSION(4,5) 852#if ECB_CPP11
853 // older implementations might have problems with decltype(x)::type, work around it
854 template<class T> struct ecb_decltype_t { typedef T type; };
764 #define ecb_decltype(x) __decltype(x) 855 #define ecb_decltype(x) ecb_decltype_t<decltype (x)>::type
765#elif ECB_GCC_VERSION(3,0) 856#elif ECB_GCC_VERSION(3,0) || ECB_CLANG_VERSION(2,8)
766 #define ecb_decltype(x) __typeof(x) 857 #define ecb_decltype(x) __typeof__ (x)
767#endif 858#endif
768 859
860#if _MSC_VER >= 1300
861 #define ecb_deprecated __declspec (deprecated)
862#else
863 #define ecb_deprecated ecb_attribute ((__deprecated__))
864#endif
865
866#if _MSC_VER >= 1500
867 #define ecb_deprecated_message(msg) __declspec (deprecated (msg))
868#elif ECB_GCC_VERSION(4,5)
869 #define ecb_deprecated_message(msg) ecb_attribute ((__deprecated__ (msg))
870#else
871 #define ecb_deprecated_message(msg) ecb_deprecated
872#endif
873
874#if _MSC_VER >= 1400
875 #define ecb_noinline __declspec (noinline)
876#else
769#define ecb_noinline ecb_attribute ((__noinline__)) 877 #define ecb_noinline ecb_attribute ((__noinline__))
878#endif
879
770#define ecb_unused ecb_attribute ((__unused__)) 880#define ecb_unused ecb_attribute ((__unused__))
771#define ecb_const ecb_attribute ((__const__)) 881#define ecb_const ecb_attribute ((__const__))
772#define ecb_pure ecb_attribute ((__pure__)) 882#define ecb_pure ecb_attribute ((__pure__))
773 883
774#if ECB_C11 884#if ECB_C11 || __IBMC_NORETURN
885 /* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/language_ref/noreturn.html */
775 #define ecb_noreturn _Noreturn 886 #define ecb_noreturn _Noreturn
887#elif ECB_CPP11
888 #define ecb_noreturn [[noreturn]]
889#elif _MSC_VER >= 1200
890 /* http://msdn.microsoft.com/en-us/library/k6ktzx3s.aspx */
891 #define ecb_noreturn __declspec (noreturn)
776#else 892#else
777 #define ecb_noreturn ecb_attribute ((__noreturn__)) 893 #define ecb_noreturn ecb_attribute ((__noreturn__))
778#endif 894#endif
779 895
780#if ECB_GCC_VERSION(4,3) 896#if ECB_GCC_VERSION(4,3)
795/* for compatibility to the rest of the world */ 911/* for compatibility to the rest of the world */
796#define ecb_likely(expr) ecb_expect_true (expr) 912#define ecb_likely(expr) ecb_expect_true (expr)
797#define ecb_unlikely(expr) ecb_expect_false (expr) 913#define ecb_unlikely(expr) ecb_expect_false (expr)
798 914
799/* count trailing zero bits and count # of one bits */ 915/* count trailing zero bits and count # of one bits */
800#if ECB_GCC_VERSION(3,4) 916#if ECB_GCC_VERSION(3,4) \
917 || (ECB_CLANG_BUILTIN(__builtin_clz) && ECB_CLANG_BUILTIN(__builtin_clzll) \
918 && ECB_CLANG_BUILTIN(__builtin_ctz) && ECB_CLANG_BUILTIN(__builtin_ctzll) \
919 && ECB_CLANG_BUILTIN(__builtin_popcount))
801 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */ 920 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */
802 #define ecb_ld32(x) (__builtin_clz (x) ^ 31) 921 #define ecb_ld32(x) (__builtin_clz (x) ^ 31)
803 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63) 922 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63)
804 #define ecb_ctz32(x) __builtin_ctz (x) 923 #define ecb_ctz32(x) __builtin_ctz (x)
805 #define ecb_ctz64(x) __builtin_ctzll (x) 924 #define ecb_ctz64(x) __builtin_ctzll (x)
806 #define ecb_popcount32(x) __builtin_popcount (x) 925 #define ecb_popcount32(x) __builtin_popcount (x)
807 /* no popcountll */ 926 /* no popcountll */
808#else 927#else
809 ecb_function_ int ecb_ctz32 (uint32_t x) ecb_const; 928 ecb_function_ ecb_const int ecb_ctz32 (uint32_t x);
810 ecb_function_ int 929 ecb_function_ ecb_const int
811 ecb_ctz32 (uint32_t x) 930 ecb_ctz32 (uint32_t x)
812 { 931 {
932#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
933 unsigned long r;
934 _BitScanForward (&r, x);
935 return (int)r;
936#else
813 int r = 0; 937 int r = 0;
814 938
815 x &= ~x + 1; /* this isolates the lowest bit */ 939 x &= ~x + 1; /* this isolates the lowest bit */
816 940
817#if ECB_branchless_on_i386 941#if ECB_branchless_on_i386
827 if (x & 0xff00ff00) r += 8; 951 if (x & 0xff00ff00) r += 8;
828 if (x & 0xffff0000) r += 16; 952 if (x & 0xffff0000) r += 16;
829#endif 953#endif
830 954
831 return r; 955 return r;
956#endif
832 } 957 }
833 958
834 ecb_function_ int ecb_ctz64 (uint64_t x) ecb_const; 959 ecb_function_ ecb_const int ecb_ctz64 (uint64_t x);
835 ecb_function_ int 960 ecb_function_ ecb_const int
836 ecb_ctz64 (uint64_t x) 961 ecb_ctz64 (uint64_t x)
837 { 962 {
963#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
964 unsigned long r;
965 _BitScanForward64 (&r, x);
966 return (int)r;
967#else
838 int shift = x & 0xffffffffU ? 0 : 32; 968 int shift = x & 0xffffffff ? 0 : 32;
839 return ecb_ctz32 (x >> shift) + shift; 969 return ecb_ctz32 (x >> shift) + shift;
970#endif
840 } 971 }
841 972
842 ecb_function_ int ecb_popcount32 (uint32_t x) ecb_const; 973 ecb_function_ ecb_const int ecb_popcount32 (uint32_t x);
843 ecb_function_ int 974 ecb_function_ ecb_const int
844 ecb_popcount32 (uint32_t x) 975 ecb_popcount32 (uint32_t x)
845 { 976 {
846 x -= (x >> 1) & 0x55555555; 977 x -= (x >> 1) & 0x55555555;
847 x = ((x >> 2) & 0x33333333) + (x & 0x33333333); 978 x = ((x >> 2) & 0x33333333) + (x & 0x33333333);
848 x = ((x >> 4) + x) & 0x0f0f0f0f; 979 x = ((x >> 4) + x) & 0x0f0f0f0f;
849 x *= 0x01010101; 980 x *= 0x01010101;
850 981
851 return x >> 24; 982 return x >> 24;
852 } 983 }
853 984
854 ecb_function_ int ecb_ld32 (uint32_t x) ecb_const; 985 ecb_function_ ecb_const int ecb_ld32 (uint32_t x);
855 ecb_function_ int ecb_ld32 (uint32_t x) 986 ecb_function_ ecb_const int ecb_ld32 (uint32_t x)
856 { 987 {
988#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
989 unsigned long r;
990 _BitScanReverse (&r, x);
991 return (int)r;
992#else
857 int r = 0; 993 int r = 0;
858 994
859 if (x >> 16) { x >>= 16; r += 16; } 995 if (x >> 16) { x >>= 16; r += 16; }
860 if (x >> 8) { x >>= 8; r += 8; } 996 if (x >> 8) { x >>= 8; r += 8; }
861 if (x >> 4) { x >>= 4; r += 4; } 997 if (x >> 4) { x >>= 4; r += 4; }
862 if (x >> 2) { x >>= 2; r += 2; } 998 if (x >> 2) { x >>= 2; r += 2; }
863 if (x >> 1) { r += 1; } 999 if (x >> 1) { r += 1; }
864 1000
865 return r; 1001 return r;
1002#endif
866 } 1003 }
867 1004
868 ecb_function_ int ecb_ld64 (uint64_t x) ecb_const; 1005 ecb_function_ ecb_const int ecb_ld64 (uint64_t x);
869 ecb_function_ int ecb_ld64 (uint64_t x) 1006 ecb_function_ ecb_const int ecb_ld64 (uint64_t x)
870 { 1007 {
1008#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
1009 unsigned long r;
1010 _BitScanReverse64 (&r, x);
1011 return (int)r;
1012#else
871 int r = 0; 1013 int r = 0;
872 1014
873 if (x >> 32) { x >>= 32; r += 32; } 1015 if (x >> 32) { x >>= 32; r += 32; }
874 1016
875 return r + ecb_ld32 (x); 1017 return r + ecb_ld32 (x);
1018#endif
876 } 1019 }
877#endif 1020#endif
878 1021
879ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) ecb_const; 1022ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x);
880ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); } 1023ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); }
881ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) ecb_const; 1024ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x);
882ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); } 1025ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); }
883 1026
884ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) ecb_const; 1027ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x);
885ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) 1028ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x)
886{ 1029{
887 return ( (x * 0x0802U & 0x22110U) 1030 return ( (x * 0x0802U & 0x22110U)
888 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16; 1031 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16;
889} 1032}
890 1033
891ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) ecb_const; 1034ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x);
892ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) 1035ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x)
893{ 1036{
894 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1); 1037 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1);
895 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2); 1038 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2);
896 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4); 1039 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4);
897 x = ( x >> 8 ) | ( x << 8); 1040 x = ( x >> 8 ) | ( x << 8);
898 1041
899 return x; 1042 return x;
900} 1043}
901 1044
902ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) ecb_const; 1045ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x);
903ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) 1046ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x)
904{ 1047{
905 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1); 1048 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1);
906 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2); 1049 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2);
907 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4); 1050 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4);
908 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8); 1051 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8);
911 return x; 1054 return x;
912} 1055}
913 1056
914/* popcount64 is only available on 64 bit cpus as gcc builtin */ 1057/* popcount64 is only available on 64 bit cpus as gcc builtin */
915/* so for this version we are lazy */ 1058/* so for this version we are lazy */
916ecb_function_ int ecb_popcount64 (uint64_t x) ecb_const; 1059ecb_function_ ecb_const int ecb_popcount64 (uint64_t x);
917ecb_function_ int 1060ecb_function_ ecb_const int
918ecb_popcount64 (uint64_t x) 1061ecb_popcount64 (uint64_t x)
919{ 1062{
920 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32); 1063 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32);
921} 1064}
922 1065
923ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) ecb_const; 1066ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count);
924ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) ecb_const; 1067ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count);
925ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) ecb_const; 1068ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count);
926ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) ecb_const; 1069ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count);
927ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) ecb_const; 1070ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count);
928ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) ecb_const; 1071ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count);
929ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) ecb_const; 1072ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count);
930ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) ecb_const; 1073ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count);
931 1074
932ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); } 1075ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); }
933ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); } 1076ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); }
934ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); } 1077ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); }
935ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); } 1078ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); }
936ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); } 1079ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); }
937ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); } 1080ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); }
938ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); } 1081ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); }
939ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); } 1082ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); }
940 1083
941#if ECB_GCC_VERSION(4,3) 1084#if ECB_GCC_VERSION(4,3) || (ECB_CLANG_BUILTIN(__builtin_bswap32) && ECB_CLANG_BUILTIN(__builtin_bswap64))
1085 #if ECB_GCC_VERSION(4,8) || ECB_CLANG_BUILTIN(__builtin_bswap16)
1086 #define ecb_bswap16(x) __builtin_bswap16 (x)
1087 #else
942 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16) 1088 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16)
1089 #endif
943 #define ecb_bswap32(x) __builtin_bswap32 (x) 1090 #define ecb_bswap32(x) __builtin_bswap32 (x)
944 #define ecb_bswap64(x) __builtin_bswap64 (x) 1091 #define ecb_bswap64(x) __builtin_bswap64 (x)
1092#elif _MSC_VER
1093 #include <stdlib.h>
1094 #define ecb_bswap16(x) ((uint16_t)_byteswap_ushort ((uint16_t)(x)))
1095 #define ecb_bswap32(x) ((uint32_t)_byteswap_ulong ((uint32_t)(x)))
1096 #define ecb_bswap64(x) ((uint64_t)_byteswap_uint64 ((uint64_t)(x)))
945#else 1097#else
946 ecb_function_ uint16_t ecb_bswap16 (uint16_t x) ecb_const; 1098 ecb_function_ ecb_const uint16_t ecb_bswap16 (uint16_t x);
947 ecb_function_ uint16_t 1099 ecb_function_ ecb_const uint16_t
948 ecb_bswap16 (uint16_t x) 1100 ecb_bswap16 (uint16_t x)
949 { 1101 {
950 return ecb_rotl16 (x, 8); 1102 return ecb_rotl16 (x, 8);
951 } 1103 }
952 1104
953 ecb_function_ uint32_t ecb_bswap32 (uint32_t x) ecb_const; 1105 ecb_function_ ecb_const uint32_t ecb_bswap32 (uint32_t x);
954 ecb_function_ uint32_t 1106 ecb_function_ ecb_const uint32_t
955 ecb_bswap32 (uint32_t x) 1107 ecb_bswap32 (uint32_t x)
956 { 1108 {
957 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16); 1109 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16);
958 } 1110 }
959 1111
960 ecb_function_ uint64_t ecb_bswap64 (uint64_t x) ecb_const; 1112 ecb_function_ ecb_const uint64_t ecb_bswap64 (uint64_t x);
961 ecb_function_ uint64_t 1113 ecb_function_ ecb_const uint64_t
962 ecb_bswap64 (uint64_t x) 1114 ecb_bswap64 (uint64_t x)
963 { 1115 {
964 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32); 1116 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32);
965 } 1117 }
966#endif 1118#endif
967 1119
968#if ECB_GCC_VERSION(4,5) 1120#if ECB_GCC_VERSION(4,5) || ECB_CLANG_BUILTIN(__builtin_unreachable)
969 #define ecb_unreachable() __builtin_unreachable () 1121 #define ecb_unreachable() __builtin_unreachable ()
970#else 1122#else
971 /* this seems to work fine, but gcc always emits a warning for it :/ */ 1123 /* this seems to work fine, but gcc always emits a warning for it :/ */
972 ecb_inline void ecb_unreachable (void) ecb_noreturn; 1124 ecb_inline ecb_noreturn void ecb_unreachable (void);
973 ecb_inline void ecb_unreachable (void) { } 1125 ecb_inline ecb_noreturn void ecb_unreachable (void) { }
974#endif 1126#endif
975 1127
976/* try to tell the compiler that some condition is definitely true */ 1128/* try to tell the compiler that some condition is definitely true */
977#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0 1129#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0
978 1130
979ecb_inline unsigned char ecb_byteorder_helper (void) ecb_const; 1131ecb_inline ecb_const uint32_t ecb_byteorder_helper (void);
980ecb_inline unsigned char 1132ecb_inline ecb_const uint32_t
981ecb_byteorder_helper (void) 1133ecb_byteorder_helper (void)
982{ 1134{
983 /* the union code still generates code under pressure in gcc, */ 1135 /* the union code still generates code under pressure in gcc, */
984 /* but less than using pointers, and always seems to */ 1136 /* but less than using pointers, and always seems to */
985 /* successfully return a constant. */ 1137 /* successfully return a constant. */
986 /* the reason why we have this horrible preprocessor mess */ 1138 /* the reason why we have this horrible preprocessor mess */
987 /* is to avoid it in all cases, at least on common architectures */ 1139 /* is to avoid it in all cases, at least on common architectures */
988 /* or when using a recent enough gcc version (>= 4.6) */ 1140 /* or when using a recent enough gcc version (>= 4.6) */
989#if __i386 || __i386__ || _M_X86 || __amd64 || __amd64__ || _M_X64
990 return 0x44;
991#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__ 1141#if (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__) \
1142 || ((__i386 || __i386__ || _M_IX86 || ECB_GCC_AMD64 || ECB_MSVC_AMD64) && !__VOS__)
1143 #define ECB_LITTLE_ENDIAN 1
992 return 0x44; 1144 return 0x44332211;
993#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__ 1145#elif (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__) \
1146 || ((__AARCH64EB__ || __MIPSEB__ || __ARMEB__) && !__VOS__)
1147 #define ECB_BIG_ENDIAN 1
994 return 0x11; 1148 return 0x11223344;
995#else 1149#else
996 union 1150 union
997 { 1151 {
1152 uint8_t c[4];
998 uint32_t i; 1153 uint32_t u;
999 uint8_t c;
1000 } u = { 0x11223344 }; 1154 } u = { 0x11, 0x22, 0x33, 0x44 };
1001 return u.c; 1155 return u.u;
1002#endif 1156#endif
1003} 1157}
1004 1158
1005ecb_inline ecb_bool ecb_big_endian (void) ecb_const; 1159ecb_inline ecb_const ecb_bool ecb_big_endian (void);
1006ecb_inline ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11; } 1160ecb_inline ecb_const ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11223344; }
1007ecb_inline ecb_bool ecb_little_endian (void) ecb_const; 1161ecb_inline ecb_const ecb_bool ecb_little_endian (void);
1008ecb_inline ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44; } 1162ecb_inline ecb_const ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44332211; }
1009 1163
1010#if ECB_GCC_VERSION(3,0) || ECB_C99 1164#if ECB_GCC_VERSION(3,0) || ECB_C99
1011 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0)) 1165 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0))
1012#else 1166#else
1013 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n))) 1167 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n)))
1014#endif 1168#endif
1015 1169
1016#if __cplusplus 1170#if ECB_CPP
1017 template<typename T> 1171 template<typename T>
1018 static inline T ecb_div_rd (T val, T div) 1172 static inline T ecb_div_rd (T val, T div)
1019 { 1173 {
1020 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div; 1174 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div;
1021 } 1175 }
1038 } 1192 }
1039#else 1193#else
1040 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0])) 1194 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0]))
1041#endif 1195#endif
1042 1196
1197ecb_function_ ecb_const uint32_t ecb_binary16_to_binary32 (uint32_t x);
1198ecb_function_ ecb_const uint32_t
1199ecb_binary16_to_binary32 (uint32_t x)
1200{
1201 unsigned int s = (x & 0x8000) << (31 - 15);
1202 int e = (x >> 10) & 0x001f;
1203 unsigned int m = x & 0x03ff;
1204
1205 if (ecb_expect_false (e == 31))
1206 /* infinity or NaN */
1207 e = 255 - (127 - 15);
1208 else if (ecb_expect_false (!e))
1209 {
1210 if (ecb_expect_true (!m))
1211 /* zero, handled by code below by forcing e to 0 */
1212 e = 0 - (127 - 15);
1213 else
1214 {
1215 /* subnormal, renormalise */
1216 unsigned int s = 10 - ecb_ld32 (m);
1217
1218 m = (m << s) & 0x3ff; /* mask implicit bit */
1219 e -= s - 1;
1220 }
1221 }
1222
1223 /* e and m now are normalised, or zero, (or inf or nan) */
1224 e += 127 - 15;
1225
1226 return s | (e << 23) | (m << (23 - 10));
1227}
1228
1229ecb_function_ ecb_const uint16_t ecb_binary32_to_binary16 (uint32_t x);
1230ecb_function_ ecb_const uint16_t
1231ecb_binary32_to_binary16 (uint32_t x)
1232{
1233 unsigned int s = (x >> 16) & 0x00008000; /* sign bit, the easy part */
1234 unsigned int e = ((x >> 23) & 0x000000ff) - (127 - 15); /* the desired exponent */
1235 unsigned int m = x & 0x007fffff;
1236
1237 x &= 0x7fffffff;
1238
1239 /* if it's within range of binary16 normals, use fast path */
1240 if (ecb_expect_true (0x38800000 <= x && x <= 0x477fefff))
1241 {
1242 /* mantissa round-to-even */
1243 m += 0x00000fff + ((m >> (23 - 10)) & 1);
1244
1245 /* handle overflow */
1246 if (ecb_expect_false (m >= 0x00800000))
1247 {
1248 m >>= 1;
1249 e += 1;
1250 }
1251
1252 return s | (e << 10) | (m >> (23 - 10));
1253 }
1254
1255 /* handle large numbers and infinity */
1256 if (ecb_expect_true (0x477fefff < x && x <= 0x7f800000))
1257 return s | 0x7c00;
1258
1259 /* handle zero, subnormals and small numbers */
1260 if (ecb_expect_true (x < 0x38800000))
1261 {
1262 /* zero */
1263 if (ecb_expect_true (!x))
1264 return s;
1265
1266 /* handle subnormals */
1267
1268 /* too small, will be zero */
1269 if (e < (14 - 24)) /* might not be sharp, but is good enough */
1270 return s;
1271
1272 m |= 0x00800000; /* make implicit bit explicit */
1273
1274 /* very tricky - we need to round to the nearest e (+10) bit value */
1275 {
1276 unsigned int bits = 14 - e;
1277 unsigned int half = (1 << (bits - 1)) - 1;
1278 unsigned int even = (m >> bits) & 1;
1279
1280 /* if this overflows, we will end up with a normalised number */
1281 m = (m + half + even) >> bits;
1282 }
1283
1284 return s | m;
1285 }
1286
1287 /* handle NaNs, preserve leftmost nan bits, but make sure we don't turn them into infinities */
1288 m >>= 13;
1289
1290 return s | 0x7c00 | m | !m;
1291}
1292
1043/*******************************************************************************/ 1293/*******************************************************************************/
1044/* floating point stuff, can be disabled by defining ECB_NO_LIBM */ 1294/* floating point stuff, can be disabled by defining ECB_NO_LIBM */
1045 1295
1046/* basically, everything uses "ieee pure-endian" floating point numbers */ 1296/* basically, everything uses "ieee pure-endian" floating point numbers */
1047/* the only noteworthy exception is ancient armle, which uses order 43218765 */ 1297/* the only noteworthy exception is ancient armle, which uses order 43218765 */
1048#if 0 \ 1298#if 0 \
1049 || __i386 || __i386__ \ 1299 || __i386 || __i386__ \
1050 || __amd64 || __amd64__ || __x86_64 || __x86_64__ \ 1300 || ECB_GCC_AMD64 \
1051 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \ 1301 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \
1052 || defined __arm__ && defined __ARM_EABI__ \
1053 || defined __s390__ || defined __s390x__ \ 1302 || defined __s390__ || defined __s390x__ \
1054 || defined __mips__ \ 1303 || defined __mips__ \
1055 || defined __alpha__ \ 1304 || defined __alpha__ \
1056 || defined __hppa__ \ 1305 || defined __hppa__ \
1057 || defined __ia64__ \ 1306 || defined __ia64__ \
1307 || defined __m68k__ \
1308 || defined __m88k__ \
1309 || defined __sh__ \
1058 || defined _M_IX86 || defined _M_AMD64 || defined _M_IA64 1310 || defined _M_IX86 || defined ECB_MSVC_AMD64 || defined _M_IA64 \
1311 || (defined __arm__ && (defined __ARM_EABI__ || defined __EABI__ || defined __VFP_FP__ || defined _WIN32_WCE || defined __ANDROID__)) \
1312 || defined __aarch64__
1059 #define ECB_STDFP 1 1313 #define ECB_STDFP 1
1060 #include <string.h> /* for memcpy */ 1314 #include <string.h> /* for memcpy */
1061#else 1315#else
1062 #define ECB_STDFP 0 1316 #define ECB_STDFP 0
1063 #include <math.h> /* for frexp*, ldexp* */
1064#endif 1317#endif
1065 1318
1066#ifndef ECB_NO_LIBM 1319#ifndef ECB_NO_LIBM
1067 1320
1321 #include <math.h> /* for frexp*, ldexp*, INFINITY, NAN */
1322
1323 /* only the oldest of old doesn't have this one. solaris. */
1324 #ifdef INFINITY
1325 #define ECB_INFINITY INFINITY
1326 #else
1327 #define ECB_INFINITY HUGE_VAL
1328 #endif
1329
1330 #ifdef NAN
1331 #define ECB_NAN NAN
1332 #else
1333 #define ECB_NAN ECB_INFINITY
1334 #endif
1335
1336 #if ECB_C99 || _XOPEN_VERSION >= 600 || _POSIX_VERSION >= 200112L
1337 #define ecb_ldexpf(x,e) ldexpf ((x), (e))
1338 #define ecb_frexpf(x,e) frexpf ((x), (e))
1339 #else
1340 #define ecb_ldexpf(x,e) (float) ldexp ((double) (x), (e))
1341 #define ecb_frexpf(x,e) (float) frexp ((double) (x), (e))
1342 #endif
1343
1068 /* convert a float to ieee single/binary32 */ 1344 /* convert a float to ieee single/binary32 */
1069 ecb_function_ uint32_t ecb_float_to_binary32 (float x) ecb_const; 1345 ecb_function_ ecb_const uint32_t ecb_float_to_binary32 (float x);
1070 ecb_function_ uint32_t 1346 ecb_function_ ecb_const uint32_t
1071 ecb_float_to_binary32 (float x) 1347 ecb_float_to_binary32 (float x)
1072 { 1348 {
1073 uint32_t r; 1349 uint32_t r;
1074 1350
1075 #if ECB_STDFP 1351 #if ECB_STDFP
1082 if (x == 0e0f ) return 0x00000000U; 1358 if (x == 0e0f ) return 0x00000000U;
1083 if (x > +3.40282346638528860e+38f) return 0x7f800000U; 1359 if (x > +3.40282346638528860e+38f) return 0x7f800000U;
1084 if (x < -3.40282346638528860e+38f) return 0xff800000U; 1360 if (x < -3.40282346638528860e+38f) return 0xff800000U;
1085 if (x != x ) return 0x7fbfffffU; 1361 if (x != x ) return 0x7fbfffffU;
1086 1362
1087 m = frexpf (x, &e) * 0x1000000U; 1363 m = ecb_frexpf (x, &e) * 0x1000000U;
1088 1364
1089 r = m & 0x80000000U; 1365 r = m & 0x80000000U;
1090 1366
1091 if (r) 1367 if (r)
1092 m = -m; 1368 m = -m;
1104 1380
1105 return r; 1381 return r;
1106 } 1382 }
1107 1383
1108 /* converts an ieee single/binary32 to a float */ 1384 /* converts an ieee single/binary32 to a float */
1109 ecb_function_ float ecb_binary32_to_float (uint32_t x) ecb_const; 1385 ecb_function_ ecb_const float ecb_binary32_to_float (uint32_t x);
1110 ecb_function_ float 1386 ecb_function_ ecb_const float
1111 ecb_binary32_to_float (uint32_t x) 1387 ecb_binary32_to_float (uint32_t x)
1112 { 1388 {
1113 float r; 1389 float r;
1114 1390
1115 #if ECB_STDFP 1391 #if ECB_STDFP
1125 x |= 0x800000U; 1401 x |= 0x800000U;
1126 else 1402 else
1127 e = 1; 1403 e = 1;
1128 1404
1129 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */ 1405 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */
1130 r = ldexpf (x * (0.5f / 0x800000U), e - 126); 1406 r = ecb_ldexpf (x * (0.5f / 0x800000U), e - 126);
1131 1407
1132 r = neg ? -r : r; 1408 r = neg ? -r : r;
1133 #endif 1409 #endif
1134 1410
1135 return r; 1411 return r;
1136 } 1412 }
1137 1413
1138 /* convert a double to ieee double/binary64 */ 1414 /* convert a double to ieee double/binary64 */
1139 ecb_function_ uint64_t ecb_double_to_binary64 (double x) ecb_const; 1415 ecb_function_ ecb_const uint64_t ecb_double_to_binary64 (double x);
1140 ecb_function_ uint64_t 1416 ecb_function_ ecb_const uint64_t
1141 ecb_double_to_binary64 (double x) 1417 ecb_double_to_binary64 (double x)
1142 { 1418 {
1143 uint64_t r; 1419 uint64_t r;
1144 1420
1145 #if ECB_STDFP 1421 #if ECB_STDFP
1174 1450
1175 return r; 1451 return r;
1176 } 1452 }
1177 1453
1178 /* converts an ieee double/binary64 to a double */ 1454 /* converts an ieee double/binary64 to a double */
1179 ecb_function_ double ecb_binary64_to_double (uint64_t x) ecb_const; 1455 ecb_function_ ecb_const double ecb_binary64_to_double (uint64_t x);
1180 ecb_function_ double 1456 ecb_function_ ecb_const double
1181 ecb_binary64_to_double (uint64_t x) 1457 ecb_binary64_to_double (uint64_t x)
1182 { 1458 {
1183 double r; 1459 double r;
1184 1460
1185 #if ECB_STDFP 1461 #if ECB_STDFP
1201 1477
1202 r = neg ? -r : r; 1478 r = neg ? -r : r;
1203 #endif 1479 #endif
1204 1480
1205 return r; 1481 return r;
1482 }
1483
1484 /* convert a float to ieee half/binary16 */
1485 ecb_function_ ecb_const uint16_t ecb_float_to_binary16 (float x);
1486 ecb_function_ ecb_const uint16_t
1487 ecb_float_to_binary16 (float x)
1488 {
1489 return ecb_binary32_to_binary16 (ecb_float_to_binary32 (x));
1490 }
1491
1492 /* convert an ieee half/binary16 to float */
1493 ecb_function_ ecb_const float ecb_binary16_to_float (uint16_t x);
1494 ecb_function_ ecb_const float
1495 ecb_binary16_to_float (uint16_t x)
1496 {
1497 return ecb_binary32_to_float (ecb_binary16_to_binary32 (x));
1206 } 1498 }
1207 1499
1208#endif 1500#endif
1209 1501
1210#endif 1502#endif
2515{ 2807{
2516 return userdata; 2808 return userdata;
2517} 2809}
2518 2810
2519void 2811void
2520ev_set_invoke_pending_cb (EV_P_ void (*invoke_pending_cb)(EV_P)) EV_THROW 2812ev_set_invoke_pending_cb (EV_P_ ev_loop_callback invoke_pending_cb) EV_THROW
2521{ 2813{
2522 invoke_cb = invoke_pending_cb; 2814 invoke_cb = invoke_pending_cb;
2523} 2815}
2524 2816
2525void 2817void
2757#if EV_USE_INOTIFY 3049#if EV_USE_INOTIFY
2758 infy_fork (EV_A); 3050 infy_fork (EV_A);
2759#endif 3051#endif
2760 3052
2761#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE 3053#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE
2762 if (ev_is_active (&pipe_w)) 3054 if (ev_is_active (&pipe_w) && postfork != 2)
2763 { 3055 {
2764 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */ 3056 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */
2765 3057
2766 ev_ref (EV_A); 3058 ev_ref (EV_A);
2767 ev_io_stop (EV_A_ &pipe_w); 3059 ev_io_stop (EV_A_ &pipe_w);

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines