ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/libev/ev.c
(Generate patch)

Comparing libev/ev.c (file contents):
Revision 1.453 by root, Thu Feb 28 00:33:25 2013 UTC vs.
Revision 1.479 by root, Sun Dec 20 01:31:17 2015 UTC

1/* 1/*
2 * libev event processing core, watcher management 2 * libev event processing core, watcher management
3 * 3 *
4 * Copyright (c) 2007,2008,2009,2010,2011,2012 Marc Alexander Lehmann <libev@schmorp.de> 4 * Copyright (c) 2007,2008,2009,2010,2011,2012,2013 Marc Alexander Lehmann <libev@schmorp.de>
5 * All rights reserved. 5 * All rights reserved.
6 * 6 *
7 * Redistribution and use in source and binary forms, with or without modifica- 7 * Redistribution and use in source and binary forms, with or without modifica-
8 * tion, are permitted provided that the following conditions are met: 8 * tion, are permitted provided that the following conditions are met:
9 * 9 *
43# include EV_CONFIG_H 43# include EV_CONFIG_H
44# else 44# else
45# include "config.h" 45# include "config.h"
46# endif 46# endif
47 47
48#if HAVE_FLOOR 48# if HAVE_FLOOR
49# ifndef EV_USE_FLOOR 49# ifndef EV_USE_FLOOR
50# define EV_USE_FLOOR 1 50# define EV_USE_FLOOR 1
51# endif
51# endif 52# endif
52#endif
53 53
54# if HAVE_CLOCK_SYSCALL 54# if HAVE_CLOCK_SYSCALL
55# ifndef EV_USE_CLOCK_SYSCALL 55# ifndef EV_USE_CLOCK_SYSCALL
56# define EV_USE_CLOCK_SYSCALL 1 56# define EV_USE_CLOCK_SYSCALL 1
57# ifndef EV_USE_REALTIME 57# ifndef EV_USE_REALTIME
241#elif defined SIGARRAYSIZE 241#elif defined SIGARRAYSIZE
242# define EV_NSIG (SIGARRAYSIZE) /* Assume ary[SIGARRAYSIZE] */ 242# define EV_NSIG (SIGARRAYSIZE) /* Assume ary[SIGARRAYSIZE] */
243#elif defined _sys_nsig 243#elif defined _sys_nsig
244# define EV_NSIG (_sys_nsig) /* Solaris 2.5 */ 244# define EV_NSIG (_sys_nsig) /* Solaris 2.5 */
245#else 245#else
246# error "unable to find value for NSIG, please report" 246# define EV_NSIG (8 * sizeof (sigset_t) + 1)
247/* to make it compile regardless, just remove the above line, */
248/* but consider reporting it, too! :) */
249# define EV_NSIG 65
250#endif 247#endif
251 248
252#ifndef EV_USE_FLOOR 249#ifndef EV_USE_FLOOR
253# define EV_USE_FLOOR 0 250# define EV_USE_FLOOR 0
254#endif 251#endif
255 252
256#ifndef EV_USE_CLOCK_SYSCALL 253#ifndef EV_USE_CLOCK_SYSCALL
257# if __linux && __GLIBC__ >= 2 254# if __linux && __GLIBC__ == 2 && __GLIBC_MINOR__ < 17
258# define EV_USE_CLOCK_SYSCALL EV_FEATURE_OS 255# define EV_USE_CLOCK_SYSCALL EV_FEATURE_OS
259# else 256# else
260# define EV_USE_CLOCK_SYSCALL 0 257# define EV_USE_CLOCK_SYSCALL 0
258# endif
259#endif
260
261#if !(_POSIX_TIMERS > 0)
262# ifndef EV_USE_MONOTONIC
263# define EV_USE_MONOTONIC 0
264# endif
265# ifndef EV_USE_REALTIME
266# define EV_USE_REALTIME 0
261# endif 267# endif
262#endif 268#endif
263 269
264#ifndef EV_USE_MONOTONIC 270#ifndef EV_USE_MONOTONIC
265# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0 271# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0
485/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */ 491/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */
486/* ECB.H BEGIN */ 492/* ECB.H BEGIN */
487/* 493/*
488 * libecb - http://software.schmorp.de/pkg/libecb 494 * libecb - http://software.schmorp.de/pkg/libecb
489 * 495 *
490 * Copyright (©) 2009-2012 Marc Alexander Lehmann <libecb@schmorp.de> 496 * Copyright (©) 2009-2015 Marc Alexander Lehmann <libecb@schmorp.de>
491 * Copyright (©) 2011 Emanuele Giaquinta 497 * Copyright (©) 2011 Emanuele Giaquinta
492 * All rights reserved. 498 * All rights reserved.
493 * 499 *
494 * Redistribution and use in source and binary forms, with or without modifica- 500 * Redistribution and use in source and binary forms, with or without modifica-
495 * tion, are permitted provided that the following conditions are met: 501 * tion, are permitted provided that the following conditions are met:
509 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; 515 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
510 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, 516 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
511 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH- 517 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH-
512 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED 518 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
513 * OF THE POSSIBILITY OF SUCH DAMAGE. 519 * OF THE POSSIBILITY OF SUCH DAMAGE.
520 *
521 * Alternatively, the contents of this file may be used under the terms of
522 * the GNU General Public License ("GPL") version 2 or any later version,
523 * in which case the provisions of the GPL are applicable instead of
524 * the above. If you wish to allow the use of your version of this file
525 * only under the terms of the GPL and not to allow others to use your
526 * version of this file under the BSD license, indicate your decision
527 * by deleting the provisions above and replace them with the notice
528 * and other provisions required by the GPL. If you do not delete the
529 * provisions above, a recipient may use your version of this file under
530 * either the BSD or the GPL.
514 */ 531 */
515 532
516#ifndef ECB_H 533#ifndef ECB_H
517#define ECB_H 534#define ECB_H
518 535
519/* 16 bits major, 16 bits minor */ 536/* 16 bits major, 16 bits minor */
520#define ECB_VERSION 0x00010002 537#define ECB_VERSION 0x00010005
521 538
522#ifdef _WIN32 539#ifdef _WIN32
523 typedef signed char int8_t; 540 typedef signed char int8_t;
524 typedef unsigned char uint8_t; 541 typedef unsigned char uint8_t;
525 typedef signed short int16_t; 542 typedef signed short int16_t;
542 typedef uint32_t uintptr_t; 559 typedef uint32_t uintptr_t;
543 typedef int32_t intptr_t; 560 typedef int32_t intptr_t;
544 #endif 561 #endif
545#else 562#else
546 #include <inttypes.h> 563 #include <inttypes.h>
547 #if UINTMAX_MAX > 0xffffffffU 564 #if (defined INTPTR_MAX ? INTPTR_MAX : ULONG_MAX) > 0xffffffffU
548 #define ECB_PTRSIZE 8 565 #define ECB_PTRSIZE 8
549 #else 566 #else
550 #define ECB_PTRSIZE 4 567 #define ECB_PTRSIZE 4
568 #endif
569#endif
570
571#define ECB_GCC_AMD64 (__amd64 || __amd64__ || __x86_64 || __x86_64__)
572#define ECB_MSVC_AMD64 (_M_AMD64 || _M_X64)
573
574/* work around x32 idiocy by defining proper macros */
575#if ECB_GCC_AMD64 || ECB_MSVC_AMD64
576 #if _ILP32
577 #define ECB_AMD64_X32 1
578 #else
579 #define ECB_AMD64 1
551 #endif 580 #endif
552#endif 581#endif
553 582
554/* many compilers define __GNUC__ to some versions but then only implement 583/* many compilers define __GNUC__ to some versions but then only implement
555 * what their idiot authors think are the "more important" extensions, 584 * what their idiot authors think are the "more important" extensions,
556 * causing enormous grief in return for some better fake benchmark numbers. 585 * causing enormous grief in return for some better fake benchmark numbers.
557 * or so. 586 * or so.
558 * we try to detect these and simply assume they are not gcc - if they have 587 * we try to detect these and simply assume they are not gcc - if they have
559 * an issue with that they should have done it right in the first place. 588 * an issue with that they should have done it right in the first place.
560 */ 589 */
561#ifndef ECB_GCC_VERSION
562 #if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__ 590#if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__
563 #define ECB_GCC_VERSION(major,minor) 0 591 #define ECB_GCC_VERSION(major,minor) 0
564 #else 592#else
565 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor))) 593 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor)))
566 #endif 594#endif
567#endif
568 595
569#define ECB_C (__STDC__+0) /* this assumes that __STDC__ is either empty or a number */ 596#define ECB_CLANG_VERSION(major,minor) (__clang_major__ > (major) || (__clang_major__ == (major) && __clang_minor__ >= (minor)))
570#define ECB_C99 (__STDC_VERSION__ >= 199901L) 597
571#define ECB_C11 (__STDC_VERSION__ >= 201112L) 598#if __clang__ && defined __has_builtin
599 #define ECB_CLANG_BUILTIN(x) __has_builtin (x)
600#else
601 #define ECB_CLANG_BUILTIN(x) 0
602#endif
603
604#if __clang__ && defined __has_extension
605 #define ECB_CLANG_EXTENSION(x) __has_extension (x)
606#else
607 #define ECB_CLANG_EXTENSION(x) 0
608#endif
609
572#define ECB_CPP (__cplusplus+0) 610#define ECB_CPP (__cplusplus+0)
573#define ECB_CPP11 (__cplusplus >= 201103L) 611#define ECB_CPP11 (__cplusplus >= 201103L)
612
613#if ECB_CPP
614 #define ECB_C 0
615 #define ECB_STDC_VERSION 0
616#else
617 #define ECB_C 1
618 #define ECB_STDC_VERSION __STDC_VERSION__
619#endif
620
621#define ECB_C99 (ECB_STDC_VERSION >= 199901L)
622#define ECB_C11 (ECB_STDC_VERSION >= 201112L)
574 623
575#if ECB_CPP 624#if ECB_CPP
576 #define ECB_EXTERN_C extern "C" 625 #define ECB_EXTERN_C extern "C"
577 #define ECB_EXTERN_C_BEG ECB_EXTERN_C { 626 #define ECB_EXTERN_C_BEG ECB_EXTERN_C {
578 #define ECB_EXTERN_C_END } 627 #define ECB_EXTERN_C_END }
591 #define ECB_NO_SMP 1 640 #define ECB_NO_SMP 1
592#endif 641#endif
593 642
594#if ECB_NO_SMP 643#if ECB_NO_SMP
595 #define ECB_MEMORY_FENCE do { } while (0) 644 #define ECB_MEMORY_FENCE do { } while (0)
645#endif
646
647/* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/compiler_ref/compiler_builtins.html */
648#if __xlC__ && ECB_CPP
649 #include <builtins.h>
650#endif
651
652#if 1400 <= _MSC_VER
653 #include <intrin.h> /* fence functions _ReadBarrier, also bit search functions _BitScanReverse */
596#endif 654#endif
597 655
598#ifndef ECB_MEMORY_FENCE 656#ifndef ECB_MEMORY_FENCE
599 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110 657 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110
600 #if __i386 || __i386__ 658 #if __i386 || __i386__
601 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory") 659 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory")
602 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 660 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
603 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 661 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
604 #elif __amd64 || __amd64__ || __x86_64 || __x86_64__ 662 #elif ECB_GCC_AMD64
605 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory") 663 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory")
606 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory") 664 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
607 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 665 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
608 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ 666 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__
609 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory") 667 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory")
668 #elif defined __ARM_ARCH_2__ \
669 || defined __ARM_ARCH_3__ || defined __ARM_ARCH_3M__ \
670 || defined __ARM_ARCH_4__ || defined __ARM_ARCH_4T__ \
671 || defined __ARM_ARCH_5__ || defined __ARM_ARCH_5E__ \
672 || defined __ARM_ARCH_5T__ || defined __ARM_ARCH_5TE__ \
673 || defined __ARM_ARCH_5TEJ__
674 /* should not need any, unless running old code on newer cpu - arm doesn't support that */
610 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \ 675 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \
611 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ 676 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ \
677 || defined __ARM_ARCH_6T2__
612 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory") 678 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory")
613 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \ 679 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \
614 || defined __ARM_ARCH_7M__ || defined __ARM_ARCH_7R__ 680 || defined __ARM_ARCH_7R__ || defined __ARM_ARCH_7M__
615 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory") 681 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory")
616 #elif __sparc || __sparc__ 682 #elif __aarch64__
683 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb ish" : : : "memory")
684 #elif (__sparc || __sparc__) && !(__sparc_v8__ || defined __sparcv8)
617 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory") 685 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory")
618 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory") 686 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory")
619 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore") 687 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore")
620 #elif defined __s390__ || defined __s390x__ 688 #elif defined __s390__ || defined __s390x__
621 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory") 689 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory")
622 #elif defined __mips__ 690 #elif defined __mips__
691 /* GNU/Linux emulates sync on mips1 architectures, so we force its use */
692 /* anybody else who still uses mips1 is supposed to send in their version, with detection code. */
623 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory") 693 #define ECB_MEMORY_FENCE __asm__ __volatile__ (".set mips2; sync; .set mips0" : : : "memory")
624 #elif defined __alpha__ 694 #elif defined __alpha__
625 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mb" : : : "memory") 695 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mb" : : : "memory")
626 #elif defined __hppa__ 696 #elif defined __hppa__
627 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory") 697 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
628 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("") 698 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
629 #elif defined __ia64__ 699 #elif defined __ia64__
630 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mf" : : : "memory") 700 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mf" : : : "memory")
701 #elif defined __m68k__
702 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
703 #elif defined __m88k__
704 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("tb1 0,%%r0,128" : : : "memory")
705 #elif defined __sh__
706 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
631 #endif 707 #endif
632 #endif 708 #endif
633#endif 709#endif
634 710
635#ifndef ECB_MEMORY_FENCE 711#ifndef ECB_MEMORY_FENCE
636 #if ECB_GCC_VERSION(4,7) 712 #if ECB_GCC_VERSION(4,7)
637 /* see comment below (stdatomic.h) about the C11 memory model. */ 713 /* see comment below (stdatomic.h) about the C11 memory model. */
638 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST) 714 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST)
715 #define ECB_MEMORY_FENCE_ACQUIRE __atomic_thread_fence (__ATOMIC_ACQUIRE)
716 #define ECB_MEMORY_FENCE_RELEASE __atomic_thread_fence (__ATOMIC_RELEASE)
639 717
640 /* The __has_feature syntax from clang is so misdesigned that we cannot use it 718 #elif ECB_CLANG_EXTENSION(c_atomic)
641 * without risking compile time errors with other compilers. We *could*
642 * define our own ecb_clang_has_feature, but I just can't be bothered to work
643 * around this shit time and again.
644 * #elif defined __clang && __has_feature (cxx_atomic)
645 * // see comment below (stdatomic.h) about the C11 memory model. 719 /* see comment below (stdatomic.h) about the C11 memory model. */
646 * #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST) 720 #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST)
647 */ 721 #define ECB_MEMORY_FENCE_ACQUIRE __c11_atomic_thread_fence (__ATOMIC_ACQUIRE)
722 #define ECB_MEMORY_FENCE_RELEASE __c11_atomic_thread_fence (__ATOMIC_RELEASE)
648 723
649 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__ 724 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__
650 #define ECB_MEMORY_FENCE __sync_synchronize () 725 #define ECB_MEMORY_FENCE __sync_synchronize ()
726 #elif _MSC_VER >= 1500 /* VC++ 2008 */
727 /* apparently, microsoft broke all the memory barrier stuff in Visual Studio 2008... */
728 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier)
729 #define ECB_MEMORY_FENCE _ReadWriteBarrier (); MemoryBarrier()
730 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier (); MemoryBarrier() /* according to msdn, _ReadBarrier is not a load fence */
731 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier (); MemoryBarrier()
651 #elif _MSC_VER >= 1400 /* VC++ 2005 */ 732 #elif _MSC_VER >= 1400 /* VC++ 2005 */
652 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier) 733 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier)
653 #define ECB_MEMORY_FENCE _ReadWriteBarrier () 734 #define ECB_MEMORY_FENCE _ReadWriteBarrier ()
654 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier () /* according to msdn, _ReadBarrier is not a load fence */ 735 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier () /* according to msdn, _ReadBarrier is not a load fence */
655 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier () 736 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier ()
675 /* any fence other than seq_cst, which isn't very efficient for us. */ 756 /* any fence other than seq_cst, which isn't very efficient for us. */
676 /* Why that is, we don't know - either the C11 memory model is quite useless */ 757 /* Why that is, we don't know - either the C11 memory model is quite useless */
677 /* for most usages, or gcc and clang have a bug */ 758 /* for most usages, or gcc and clang have a bug */
678 /* I *currently* lean towards the latter, and inefficiently implement */ 759 /* I *currently* lean towards the latter, and inefficiently implement */
679 /* all three of ecb's fences as a seq_cst fence */ 760 /* all three of ecb's fences as a seq_cst fence */
761 /* Update, gcc-4.8 generates mfence for all c++ fences, but nothing */
762 /* for all __atomic_thread_fence's except seq_cst */
680 #define ECB_MEMORY_FENCE atomic_thread_fence (memory_order_seq_cst) 763 #define ECB_MEMORY_FENCE atomic_thread_fence (memory_order_seq_cst)
681 #endif 764 #endif
682#endif 765#endif
683 766
684#ifndef ECB_MEMORY_FENCE 767#ifndef ECB_MEMORY_FENCE
707 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE 790 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE
708#endif 791#endif
709 792
710/*****************************************************************************/ 793/*****************************************************************************/
711 794
712#if __cplusplus 795#if ECB_CPP
713 #define ecb_inline static inline 796 #define ecb_inline static inline
714#elif ECB_GCC_VERSION(2,5) 797#elif ECB_GCC_VERSION(2,5)
715 #define ecb_inline static __inline__ 798 #define ecb_inline static __inline__
716#elif ECB_C99 799#elif ECB_C99
717 #define ecb_inline static inline 800 #define ecb_inline static inline
731 814
732#define ECB_CONCAT_(a, b) a ## b 815#define ECB_CONCAT_(a, b) a ## b
733#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b) 816#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b)
734#define ECB_STRINGIFY_(a) # a 817#define ECB_STRINGIFY_(a) # a
735#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a) 818#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a)
819#define ECB_STRINGIFY_EXPR(expr) ((expr), ECB_STRINGIFY_ (expr))
736 820
737#define ecb_function_ ecb_inline 821#define ecb_function_ ecb_inline
738 822
739#if ECB_GCC_VERSION(3,1) 823#if ECB_GCC_VERSION(3,1) || ECB_CLANG_VERSION(2,8)
740 #define ecb_attribute(attrlist) __attribute__(attrlist) 824 #define ecb_attribute(attrlist) __attribute__ (attrlist)
825#else
826 #define ecb_attribute(attrlist)
827#endif
828
829#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_constant_p)
741 #define ecb_is_constant(expr) __builtin_constant_p (expr) 830 #define ecb_is_constant(expr) __builtin_constant_p (expr)
831#else
832 /* possible C11 impl for integral types
833 typedef struct ecb_is_constant_struct ecb_is_constant_struct;
834 #define ecb_is_constant(expr) _Generic ((1 ? (struct ecb_is_constant_struct *)0 : (void *)((expr) - (expr)), ecb_is_constant_struct *: 0, default: 1)) */
835
836 #define ecb_is_constant(expr) 0
837#endif
838
839#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_expect)
742 #define ecb_expect(expr,value) __builtin_expect ((expr),(value)) 840 #define ecb_expect(expr,value) __builtin_expect ((expr),(value))
841#else
842 #define ecb_expect(expr,value) (expr)
843#endif
844
845#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_prefetch)
743 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality) 846 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
744#else 847#else
745 #define ecb_attribute(attrlist)
746 #define ecb_is_constant(expr) 0
747 #define ecb_expect(expr,value) (expr)
748 #define ecb_prefetch(addr,rw,locality) 848 #define ecb_prefetch(addr,rw,locality)
749#endif 849#endif
750 850
751/* no emulation for ecb_decltype */ 851/* no emulation for ecb_decltype */
752#if ECB_GCC_VERSION(4,5) 852#if ECB_CPP11
853 // older implementations might have problems with decltype(x)::type, work around it
854 template<class T> struct ecb_decltype_t { typedef T type; };
753 #define ecb_decltype(x) __decltype(x) 855 #define ecb_decltype(x) ecb_decltype_t<decltype (x)>::type
754#elif ECB_GCC_VERSION(3,0) 856#elif ECB_GCC_VERSION(3,0) || ECB_CLANG_VERSION(2,8)
755 #define ecb_decltype(x) __typeof(x) 857 #define ecb_decltype(x) __typeof__ (x)
756#endif 858#endif
757 859
860#if _MSC_VER >= 1300
861 #define ecb_deprecated __declspec (deprecated)
862#else
863 #define ecb_deprecated ecb_attribute ((__deprecated__))
864#endif
865
866#if _MSC_VER >= 1500
867 #define ecb_deprecated_message(msg) __declspec (deprecated (msg))
868#elif ECB_GCC_VERSION(4,5)
869 #define ecb_deprecated_message(msg) ecb_attribute ((__deprecated__ (msg)))
870#else
871 #define ecb_deprecated_message(msg) ecb_deprecated
872#endif
873
874#if _MSC_VER >= 1400
875 #define ecb_noinline __declspec (noinline)
876#else
758#define ecb_noinline ecb_attribute ((__noinline__)) 877 #define ecb_noinline ecb_attribute ((__noinline__))
878#endif
879
759#define ecb_unused ecb_attribute ((__unused__)) 880#define ecb_unused ecb_attribute ((__unused__))
760#define ecb_const ecb_attribute ((__const__)) 881#define ecb_const ecb_attribute ((__const__))
761#define ecb_pure ecb_attribute ((__pure__)) 882#define ecb_pure ecb_attribute ((__pure__))
762 883
763#if ECB_C11 884#if ECB_C11 || __IBMC_NORETURN
885 /* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/language_ref/noreturn.html */
764 #define ecb_noreturn _Noreturn 886 #define ecb_noreturn _Noreturn
887#elif ECB_CPP11
888 #define ecb_noreturn [[noreturn]]
889#elif _MSC_VER >= 1200
890 /* http://msdn.microsoft.com/en-us/library/k6ktzx3s.aspx */
891 #define ecb_noreturn __declspec (noreturn)
765#else 892#else
766 #define ecb_noreturn ecb_attribute ((__noreturn__)) 893 #define ecb_noreturn ecb_attribute ((__noreturn__))
767#endif 894#endif
768 895
769#if ECB_GCC_VERSION(4,3) 896#if ECB_GCC_VERSION(4,3)
784/* for compatibility to the rest of the world */ 911/* for compatibility to the rest of the world */
785#define ecb_likely(expr) ecb_expect_true (expr) 912#define ecb_likely(expr) ecb_expect_true (expr)
786#define ecb_unlikely(expr) ecb_expect_false (expr) 913#define ecb_unlikely(expr) ecb_expect_false (expr)
787 914
788/* count trailing zero bits and count # of one bits */ 915/* count trailing zero bits and count # of one bits */
789#if ECB_GCC_VERSION(3,4) 916#if ECB_GCC_VERSION(3,4) \
917 || (ECB_CLANG_BUILTIN(__builtin_clz) && ECB_CLANG_BUILTIN(__builtin_clzll) \
918 && ECB_CLANG_BUILTIN(__builtin_ctz) && ECB_CLANG_BUILTIN(__builtin_ctzll) \
919 && ECB_CLANG_BUILTIN(__builtin_popcount))
790 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */ 920 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */
791 #define ecb_ld32(x) (__builtin_clz (x) ^ 31) 921 #define ecb_ld32(x) (__builtin_clz (x) ^ 31)
792 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63) 922 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63)
793 #define ecb_ctz32(x) __builtin_ctz (x) 923 #define ecb_ctz32(x) __builtin_ctz (x)
794 #define ecb_ctz64(x) __builtin_ctzll (x) 924 #define ecb_ctz64(x) __builtin_ctzll (x)
795 #define ecb_popcount32(x) __builtin_popcount (x) 925 #define ecb_popcount32(x) __builtin_popcount (x)
796 /* no popcountll */ 926 /* no popcountll */
797#else 927#else
798 ecb_function_ int ecb_ctz32 (uint32_t x) ecb_const; 928 ecb_function_ ecb_const int ecb_ctz32 (uint32_t x);
799 ecb_function_ int 929 ecb_function_ ecb_const int
800 ecb_ctz32 (uint32_t x) 930 ecb_ctz32 (uint32_t x)
801 { 931 {
932#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
933 unsigned long r;
934 _BitScanForward (&r, x);
935 return (int)r;
936#else
802 int r = 0; 937 int r = 0;
803 938
804 x &= ~x + 1; /* this isolates the lowest bit */ 939 x &= ~x + 1; /* this isolates the lowest bit */
805 940
806#if ECB_branchless_on_i386 941#if ECB_branchless_on_i386
816 if (x & 0xff00ff00) r += 8; 951 if (x & 0xff00ff00) r += 8;
817 if (x & 0xffff0000) r += 16; 952 if (x & 0xffff0000) r += 16;
818#endif 953#endif
819 954
820 return r; 955 return r;
956#endif
821 } 957 }
822 958
823 ecb_function_ int ecb_ctz64 (uint64_t x) ecb_const; 959 ecb_function_ ecb_const int ecb_ctz64 (uint64_t x);
824 ecb_function_ int 960 ecb_function_ ecb_const int
825 ecb_ctz64 (uint64_t x) 961 ecb_ctz64 (uint64_t x)
826 { 962 {
963#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
964 unsigned long r;
965 _BitScanForward64 (&r, x);
966 return (int)r;
967#else
827 int shift = x & 0xffffffffU ? 0 : 32; 968 int shift = x & 0xffffffff ? 0 : 32;
828 return ecb_ctz32 (x >> shift) + shift; 969 return ecb_ctz32 (x >> shift) + shift;
970#endif
829 } 971 }
830 972
831 ecb_function_ int ecb_popcount32 (uint32_t x) ecb_const; 973 ecb_function_ ecb_const int ecb_popcount32 (uint32_t x);
832 ecb_function_ int 974 ecb_function_ ecb_const int
833 ecb_popcount32 (uint32_t x) 975 ecb_popcount32 (uint32_t x)
834 { 976 {
835 x -= (x >> 1) & 0x55555555; 977 x -= (x >> 1) & 0x55555555;
836 x = ((x >> 2) & 0x33333333) + (x & 0x33333333); 978 x = ((x >> 2) & 0x33333333) + (x & 0x33333333);
837 x = ((x >> 4) + x) & 0x0f0f0f0f; 979 x = ((x >> 4) + x) & 0x0f0f0f0f;
838 x *= 0x01010101; 980 x *= 0x01010101;
839 981
840 return x >> 24; 982 return x >> 24;
841 } 983 }
842 984
843 ecb_function_ int ecb_ld32 (uint32_t x) ecb_const; 985 ecb_function_ ecb_const int ecb_ld32 (uint32_t x);
844 ecb_function_ int ecb_ld32 (uint32_t x) 986 ecb_function_ ecb_const int ecb_ld32 (uint32_t x)
845 { 987 {
988#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
989 unsigned long r;
990 _BitScanReverse (&r, x);
991 return (int)r;
992#else
846 int r = 0; 993 int r = 0;
847 994
848 if (x >> 16) { x >>= 16; r += 16; } 995 if (x >> 16) { x >>= 16; r += 16; }
849 if (x >> 8) { x >>= 8; r += 8; } 996 if (x >> 8) { x >>= 8; r += 8; }
850 if (x >> 4) { x >>= 4; r += 4; } 997 if (x >> 4) { x >>= 4; r += 4; }
851 if (x >> 2) { x >>= 2; r += 2; } 998 if (x >> 2) { x >>= 2; r += 2; }
852 if (x >> 1) { r += 1; } 999 if (x >> 1) { r += 1; }
853 1000
854 return r; 1001 return r;
1002#endif
855 } 1003 }
856 1004
857 ecb_function_ int ecb_ld64 (uint64_t x) ecb_const; 1005 ecb_function_ ecb_const int ecb_ld64 (uint64_t x);
858 ecb_function_ int ecb_ld64 (uint64_t x) 1006 ecb_function_ ecb_const int ecb_ld64 (uint64_t x)
859 { 1007 {
1008#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
1009 unsigned long r;
1010 _BitScanReverse64 (&r, x);
1011 return (int)r;
1012#else
860 int r = 0; 1013 int r = 0;
861 1014
862 if (x >> 32) { x >>= 32; r += 32; } 1015 if (x >> 32) { x >>= 32; r += 32; }
863 1016
864 return r + ecb_ld32 (x); 1017 return r + ecb_ld32 (x);
1018#endif
865 } 1019 }
866#endif 1020#endif
867 1021
868ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) ecb_const; 1022ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x);
869ecb_function_ ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); } 1023ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); }
870ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) ecb_const; 1024ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x);
871ecb_function_ ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); } 1025ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); }
872 1026
873ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) ecb_const; 1027ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x);
874ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) 1028ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x)
875{ 1029{
876 return ( (x * 0x0802U & 0x22110U) 1030 return ( (x * 0x0802U & 0x22110U)
877 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16; 1031 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16;
878} 1032}
879 1033
880ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) ecb_const; 1034ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x);
881ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) 1035ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x)
882{ 1036{
883 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1); 1037 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1);
884 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2); 1038 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2);
885 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4); 1039 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4);
886 x = ( x >> 8 ) | ( x << 8); 1040 x = ( x >> 8 ) | ( x << 8);
887 1041
888 return x; 1042 return x;
889} 1043}
890 1044
891ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) ecb_const; 1045ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x);
892ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) 1046ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x)
893{ 1047{
894 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1); 1048 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1);
895 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2); 1049 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2);
896 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4); 1050 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4);
897 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8); 1051 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8);
900 return x; 1054 return x;
901} 1055}
902 1056
903/* popcount64 is only available on 64 bit cpus as gcc builtin */ 1057/* popcount64 is only available on 64 bit cpus as gcc builtin */
904/* so for this version we are lazy */ 1058/* so for this version we are lazy */
905ecb_function_ int ecb_popcount64 (uint64_t x) ecb_const; 1059ecb_function_ ecb_const int ecb_popcount64 (uint64_t x);
906ecb_function_ int 1060ecb_function_ ecb_const int
907ecb_popcount64 (uint64_t x) 1061ecb_popcount64 (uint64_t x)
908{ 1062{
909 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32); 1063 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32);
910} 1064}
911 1065
912ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) ecb_const; 1066ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count);
913ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) ecb_const; 1067ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count);
914ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) ecb_const; 1068ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count);
915ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) ecb_const; 1069ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count);
916ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) ecb_const; 1070ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count);
917ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) ecb_const; 1071ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count);
918ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) ecb_const; 1072ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count);
919ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) ecb_const; 1073ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count);
920 1074
921ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); } 1075ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); }
922ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); } 1076ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); }
923ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); } 1077ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); }
924ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); } 1078ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); }
925ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); } 1079ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); }
926ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); } 1080ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); }
927ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); } 1081ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); }
928ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); } 1082ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); }
929 1083
930#if ECB_GCC_VERSION(4,3) 1084#if ECB_GCC_VERSION(4,3) || (ECB_CLANG_BUILTIN(__builtin_bswap32) && ECB_CLANG_BUILTIN(__builtin_bswap64))
1085 #if ECB_GCC_VERSION(4,8) || ECB_CLANG_BUILTIN(__builtin_bswap16)
1086 #define ecb_bswap16(x) __builtin_bswap16 (x)
1087 #else
931 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16) 1088 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16)
1089 #endif
932 #define ecb_bswap32(x) __builtin_bswap32 (x) 1090 #define ecb_bswap32(x) __builtin_bswap32 (x)
933 #define ecb_bswap64(x) __builtin_bswap64 (x) 1091 #define ecb_bswap64(x) __builtin_bswap64 (x)
1092#elif _MSC_VER
1093 #include <stdlib.h>
1094 #define ecb_bswap16(x) ((uint16_t)_byteswap_ushort ((uint16_t)(x)))
1095 #define ecb_bswap32(x) ((uint32_t)_byteswap_ulong ((uint32_t)(x)))
1096 #define ecb_bswap64(x) ((uint64_t)_byteswap_uint64 ((uint64_t)(x)))
934#else 1097#else
935 ecb_function_ uint16_t ecb_bswap16 (uint16_t x) ecb_const; 1098 ecb_function_ ecb_const uint16_t ecb_bswap16 (uint16_t x);
936 ecb_function_ uint16_t 1099 ecb_function_ ecb_const uint16_t
937 ecb_bswap16 (uint16_t x) 1100 ecb_bswap16 (uint16_t x)
938 { 1101 {
939 return ecb_rotl16 (x, 8); 1102 return ecb_rotl16 (x, 8);
940 } 1103 }
941 1104
942 ecb_function_ uint32_t ecb_bswap32 (uint32_t x) ecb_const; 1105 ecb_function_ ecb_const uint32_t ecb_bswap32 (uint32_t x);
943 ecb_function_ uint32_t 1106 ecb_function_ ecb_const uint32_t
944 ecb_bswap32 (uint32_t x) 1107 ecb_bswap32 (uint32_t x)
945 { 1108 {
946 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16); 1109 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16);
947 } 1110 }
948 1111
949 ecb_function_ uint64_t ecb_bswap64 (uint64_t x) ecb_const; 1112 ecb_function_ ecb_const uint64_t ecb_bswap64 (uint64_t x);
950 ecb_function_ uint64_t 1113 ecb_function_ ecb_const uint64_t
951 ecb_bswap64 (uint64_t x) 1114 ecb_bswap64 (uint64_t x)
952 { 1115 {
953 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32); 1116 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32);
954 } 1117 }
955#endif 1118#endif
956 1119
957#if ECB_GCC_VERSION(4,5) 1120#if ECB_GCC_VERSION(4,5) || ECB_CLANG_BUILTIN(__builtin_unreachable)
958 #define ecb_unreachable() __builtin_unreachable () 1121 #define ecb_unreachable() __builtin_unreachable ()
959#else 1122#else
960 /* this seems to work fine, but gcc always emits a warning for it :/ */ 1123 /* this seems to work fine, but gcc always emits a warning for it :/ */
961 ecb_inline void ecb_unreachable (void) ecb_noreturn; 1124 ecb_inline ecb_noreturn void ecb_unreachable (void);
962 ecb_inline void ecb_unreachable (void) { } 1125 ecb_inline ecb_noreturn void ecb_unreachable (void) { }
963#endif 1126#endif
964 1127
965/* try to tell the compiler that some condition is definitely true */ 1128/* try to tell the compiler that some condition is definitely true */
966#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0 1129#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0
967 1130
968ecb_inline unsigned char ecb_byteorder_helper (void) ecb_const; 1131ecb_inline ecb_const uint32_t ecb_byteorder_helper (void);
969ecb_inline unsigned char 1132ecb_inline ecb_const uint32_t
970ecb_byteorder_helper (void) 1133ecb_byteorder_helper (void)
971{ 1134{
972 /* the union code still generates code under pressure in gcc, */ 1135 /* the union code still generates code under pressure in gcc, */
973 /* but less than using pointers, and always seems to */ 1136 /* but less than using pointers, and always seems to */
974 /* successfully return a constant. */ 1137 /* successfully return a constant. */
975 /* the reason why we have this horrible preprocessor mess */ 1138 /* the reason why we have this horrible preprocessor mess */
976 /* is to avoid it in all cases, at least on common architectures */ 1139 /* is to avoid it in all cases, at least on common architectures */
977 /* or when using a recent enough gcc version (>= 4.6) */ 1140 /* or when using a recent enough gcc version (>= 4.6) */
978#if __i386 || __i386__ || _M_X86 || __amd64 || __amd64__ || _M_X64
979 return 0x44;
980#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__ 1141#if (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__) \
1142 || ((__i386 || __i386__ || _M_IX86 || ECB_GCC_AMD64 || ECB_MSVC_AMD64) && !__VOS__)
1143 #define ECB_LITTLE_ENDIAN 1
981 return 0x44; 1144 return 0x44332211;
982#elif __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__ 1145#elif (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__) \
1146 || ((__AARCH64EB__ || __MIPSEB__ || __ARMEB__) && !__VOS__)
1147 #define ECB_BIG_ENDIAN 1
983 return 0x11; 1148 return 0x11223344;
984#else 1149#else
985 union 1150 union
986 { 1151 {
1152 uint8_t c[4];
987 uint32_t i; 1153 uint32_t u;
988 uint8_t c;
989 } u = { 0x11223344 }; 1154 } u = { 0x11, 0x22, 0x33, 0x44 };
990 return u.c; 1155 return u.u;
991#endif 1156#endif
992} 1157}
993 1158
994ecb_inline ecb_bool ecb_big_endian (void) ecb_const; 1159ecb_inline ecb_const ecb_bool ecb_big_endian (void);
995ecb_inline ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11; } 1160ecb_inline ecb_const ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11223344; }
996ecb_inline ecb_bool ecb_little_endian (void) ecb_const; 1161ecb_inline ecb_const ecb_bool ecb_little_endian (void);
997ecb_inline ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44; } 1162ecb_inline ecb_const ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44332211; }
998 1163
999#if ECB_GCC_VERSION(3,0) || ECB_C99 1164#if ECB_GCC_VERSION(3,0) || ECB_C99
1000 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0)) 1165 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0))
1001#else 1166#else
1002 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n))) 1167 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n)))
1003#endif 1168#endif
1004 1169
1005#if __cplusplus 1170#if ECB_CPP
1006 template<typename T> 1171 template<typename T>
1007 static inline T ecb_div_rd (T val, T div) 1172 static inline T ecb_div_rd (T val, T div)
1008 { 1173 {
1009 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div; 1174 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div;
1010 } 1175 }
1027 } 1192 }
1028#else 1193#else
1029 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0])) 1194 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0]))
1030#endif 1195#endif
1031 1196
1197ecb_function_ ecb_const uint32_t ecb_binary16_to_binary32 (uint32_t x);
1198ecb_function_ ecb_const uint32_t
1199ecb_binary16_to_binary32 (uint32_t x)
1200{
1201 unsigned int s = (x & 0x8000) << (31 - 15);
1202 int e = (x >> 10) & 0x001f;
1203 unsigned int m = x & 0x03ff;
1204
1205 if (ecb_expect_false (e == 31))
1206 /* infinity or NaN */
1207 e = 255 - (127 - 15);
1208 else if (ecb_expect_false (!e))
1209 {
1210 if (ecb_expect_true (!m))
1211 /* zero, handled by code below by forcing e to 0 */
1212 e = 0 - (127 - 15);
1213 else
1214 {
1215 /* subnormal, renormalise */
1216 unsigned int s = 10 - ecb_ld32 (m);
1217
1218 m = (m << s) & 0x3ff; /* mask implicit bit */
1219 e -= s - 1;
1220 }
1221 }
1222
1223 /* e and m now are normalised, or zero, (or inf or nan) */
1224 e += 127 - 15;
1225
1226 return s | (e << 23) | (m << (23 - 10));
1227}
1228
1229ecb_function_ ecb_const uint16_t ecb_binary32_to_binary16 (uint32_t x);
1230ecb_function_ ecb_const uint16_t
1231ecb_binary32_to_binary16 (uint32_t x)
1232{
1233 unsigned int s = (x >> 16) & 0x00008000; /* sign bit, the easy part */
1234 unsigned int e = ((x >> 23) & 0x000000ff) - (127 - 15); /* the desired exponent */
1235 unsigned int m = x & 0x007fffff;
1236
1237 x &= 0x7fffffff;
1238
1239 /* if it's within range of binary16 normals, use fast path */
1240 if (ecb_expect_true (0x38800000 <= x && x <= 0x477fefff))
1241 {
1242 /* mantissa round-to-even */
1243 m += 0x00000fff + ((m >> (23 - 10)) & 1);
1244
1245 /* handle overflow */
1246 if (ecb_expect_false (m >= 0x00800000))
1247 {
1248 m >>= 1;
1249 e += 1;
1250 }
1251
1252 return s | (e << 10) | (m >> (23 - 10));
1253 }
1254
1255 /* handle large numbers and infinity */
1256 if (ecb_expect_true (0x477fefff < x && x <= 0x7f800000))
1257 return s | 0x7c00;
1258
1259 /* handle zero, subnormals and small numbers */
1260 if (ecb_expect_true (x < 0x38800000))
1261 {
1262 /* zero */
1263 if (ecb_expect_true (!x))
1264 return s;
1265
1266 /* handle subnormals */
1267
1268 /* too small, will be zero */
1269 if (e < (14 - 24)) /* might not be sharp, but is good enough */
1270 return s;
1271
1272 m |= 0x00800000; /* make implicit bit explicit */
1273
1274 /* very tricky - we need to round to the nearest e (+10) bit value */
1275 {
1276 unsigned int bits = 14 - e;
1277 unsigned int half = (1 << (bits - 1)) - 1;
1278 unsigned int even = (m >> bits) & 1;
1279
1280 /* if this overflows, we will end up with a normalised number */
1281 m = (m + half + even) >> bits;
1282 }
1283
1284 return s | m;
1285 }
1286
1287 /* handle NaNs, preserve leftmost nan bits, but make sure we don't turn them into infinities */
1288 m >>= 13;
1289
1290 return s | 0x7c00 | m | !m;
1291}
1292
1032/*******************************************************************************/ 1293/*******************************************************************************/
1033/* floating point stuff, can be disabled by defining ECB_NO_LIBM */ 1294/* floating point stuff, can be disabled by defining ECB_NO_LIBM */
1034 1295
1035/* basically, everything uses "ieee pure-endian" floating point numbers */ 1296/* basically, everything uses "ieee pure-endian" floating point numbers */
1036/* the only noteworthy exception is ancient armle, which uses order 43218765 */ 1297/* the only noteworthy exception is ancient armle, which uses order 43218765 */
1037#if 0 \ 1298#if 0 \
1038 || __i386 || __i386__ \ 1299 || __i386 || __i386__ \
1039 || __amd64 || __amd64__ || __x86_64 || __x86_64__ \ 1300 || ECB_GCC_AMD64 \
1040 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \ 1301 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \
1041 || defined __arm__ && defined __ARM_EABI__ \
1042 || defined __s390__ || defined __s390x__ \ 1302 || defined __s390__ || defined __s390x__ \
1043 || defined __mips__ \ 1303 || defined __mips__ \
1044 || defined __alpha__ \ 1304 || defined __alpha__ \
1045 || defined __hppa__ \ 1305 || defined __hppa__ \
1046 || defined __ia64__ \ 1306 || defined __ia64__ \
1307 || defined __m68k__ \
1308 || defined __m88k__ \
1309 || defined __sh__ \
1047 || defined _M_IX86 || defined _M_AMD64 || defined _M_IA64 1310 || defined _M_IX86 || defined ECB_MSVC_AMD64 || defined _M_IA64 \
1311 || (defined __arm__ && (defined __ARM_EABI__ || defined __EABI__ || defined __VFP_FP__ || defined _WIN32_WCE || defined __ANDROID__)) \
1312 || defined __aarch64__
1048 #define ECB_STDFP 1 1313 #define ECB_STDFP 1
1049 #include <string.h> /* for memcpy */ 1314 #include <string.h> /* for memcpy */
1050#else 1315#else
1051 #define ECB_STDFP 0 1316 #define ECB_STDFP 0
1052 #include <math.h> /* for frexp*, ldexp* */
1053#endif 1317#endif
1054 1318
1055#ifndef ECB_NO_LIBM 1319#ifndef ECB_NO_LIBM
1056 1320
1321 #include <math.h> /* for frexp*, ldexp*, INFINITY, NAN */
1322
1323 /* only the oldest of old doesn't have this one. solaris. */
1324 #ifdef INFINITY
1325 #define ECB_INFINITY INFINITY
1326 #else
1327 #define ECB_INFINITY HUGE_VAL
1328 #endif
1329
1330 #ifdef NAN
1331 #define ECB_NAN NAN
1332 #else
1333 #define ECB_NAN ECB_INFINITY
1334 #endif
1335
1336 #if ECB_C99 || _XOPEN_VERSION >= 600 || _POSIX_VERSION >= 200112L
1337 #define ecb_ldexpf(x,e) ldexpf ((x), (e))
1338 #define ecb_frexpf(x,e) frexpf ((x), (e))
1339 #else
1340 #define ecb_ldexpf(x,e) (float) ldexp ((double) (x), (e))
1341 #define ecb_frexpf(x,e) (float) frexp ((double) (x), (e))
1342 #endif
1343
1057 /* convert a float to ieee single/binary32 */ 1344 /* convert a float to ieee single/binary32 */
1058 ecb_function_ uint32_t ecb_float_to_binary32 (float x) ecb_const; 1345 ecb_function_ ecb_const uint32_t ecb_float_to_binary32 (float x);
1059 ecb_function_ uint32_t 1346 ecb_function_ ecb_const uint32_t
1060 ecb_float_to_binary32 (float x) 1347 ecb_float_to_binary32 (float x)
1061 { 1348 {
1062 uint32_t r; 1349 uint32_t r;
1063 1350
1064 #if ECB_STDFP 1351 #if ECB_STDFP
1071 if (x == 0e0f ) return 0x00000000U; 1358 if (x == 0e0f ) return 0x00000000U;
1072 if (x > +3.40282346638528860e+38f) return 0x7f800000U; 1359 if (x > +3.40282346638528860e+38f) return 0x7f800000U;
1073 if (x < -3.40282346638528860e+38f) return 0xff800000U; 1360 if (x < -3.40282346638528860e+38f) return 0xff800000U;
1074 if (x != x ) return 0x7fbfffffU; 1361 if (x != x ) return 0x7fbfffffU;
1075 1362
1076 m = frexpf (x, &e) * 0x1000000U; 1363 m = ecb_frexpf (x, &e) * 0x1000000U;
1077 1364
1078 r = m & 0x80000000U; 1365 r = m & 0x80000000U;
1079 1366
1080 if (r) 1367 if (r)
1081 m = -m; 1368 m = -m;
1093 1380
1094 return r; 1381 return r;
1095 } 1382 }
1096 1383
1097 /* converts an ieee single/binary32 to a float */ 1384 /* converts an ieee single/binary32 to a float */
1098 ecb_function_ float ecb_binary32_to_float (uint32_t x) ecb_const; 1385 ecb_function_ ecb_const float ecb_binary32_to_float (uint32_t x);
1099 ecb_function_ float 1386 ecb_function_ ecb_const float
1100 ecb_binary32_to_float (uint32_t x) 1387 ecb_binary32_to_float (uint32_t x)
1101 { 1388 {
1102 float r; 1389 float r;
1103 1390
1104 #if ECB_STDFP 1391 #if ECB_STDFP
1114 x |= 0x800000U; 1401 x |= 0x800000U;
1115 else 1402 else
1116 e = 1; 1403 e = 1;
1117 1404
1118 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */ 1405 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */
1119 r = ldexpf (x * (0.5f / 0x800000U), e - 126); 1406 r = ecb_ldexpf (x * (0.5f / 0x800000U), e - 126);
1120 1407
1121 r = neg ? -r : r; 1408 r = neg ? -r : r;
1122 #endif 1409 #endif
1123 1410
1124 return r; 1411 return r;
1125 } 1412 }
1126 1413
1127 /* convert a double to ieee double/binary64 */ 1414 /* convert a double to ieee double/binary64 */
1128 ecb_function_ uint64_t ecb_double_to_binary64 (double x) ecb_const; 1415 ecb_function_ ecb_const uint64_t ecb_double_to_binary64 (double x);
1129 ecb_function_ uint64_t 1416 ecb_function_ ecb_const uint64_t
1130 ecb_double_to_binary64 (double x) 1417 ecb_double_to_binary64 (double x)
1131 { 1418 {
1132 uint64_t r; 1419 uint64_t r;
1133 1420
1134 #if ECB_STDFP 1421 #if ECB_STDFP
1163 1450
1164 return r; 1451 return r;
1165 } 1452 }
1166 1453
1167 /* converts an ieee double/binary64 to a double */ 1454 /* converts an ieee double/binary64 to a double */
1168 ecb_function_ double ecb_binary64_to_double (uint64_t x) ecb_const; 1455 ecb_function_ ecb_const double ecb_binary64_to_double (uint64_t x);
1169 ecb_function_ double 1456 ecb_function_ ecb_const double
1170 ecb_binary64_to_double (uint64_t x) 1457 ecb_binary64_to_double (uint64_t x)
1171 { 1458 {
1172 double r; 1459 double r;
1173 1460
1174 #if ECB_STDFP 1461 #if ECB_STDFP
1190 1477
1191 r = neg ? -r : r; 1478 r = neg ? -r : r;
1192 #endif 1479 #endif
1193 1480
1194 return r; 1481 return r;
1482 }
1483
1484 /* convert a float to ieee half/binary16 */
1485 ecb_function_ ecb_const uint16_t ecb_float_to_binary16 (float x);
1486 ecb_function_ ecb_const uint16_t
1487 ecb_float_to_binary16 (float x)
1488 {
1489 return ecb_binary32_to_binary16 (ecb_float_to_binary32 (x));
1490 }
1491
1492 /* convert an ieee half/binary16 to float */
1493 ecb_function_ ecb_const float ecb_binary16_to_float (uint16_t x);
1494 ecb_function_ ecb_const float
1495 ecb_binary16_to_float (uint16_t x)
1496 {
1497 return ecb_binary32_to_float (ecb_binary16_to_binary32 (x));
1195 } 1498 }
1196 1499
1197#endif 1500#endif
1198 1501
1199#endif 1502#endif
2095 ev_syserr ("(libev) error creating signal/async pipe"); 2398 ev_syserr ("(libev) error creating signal/async pipe");
2096 2399
2097 fd_intern (fds [0]); 2400 fd_intern (fds [0]);
2098 } 2401 }
2099 2402
2100 fd_intern (fds [1]);
2101
2102 evpipe [0] = fds [0]; 2403 evpipe [0] = fds [0];
2103 2404
2104 if (evpipe [1] < 0) 2405 if (evpipe [1] < 0)
2105 evpipe [1] = fds [1]; /* first call, set write fd */ 2406 evpipe [1] = fds [1]; /* first call, set write fd */
2106 else 2407 else
2111 /* so must not be executed on windows */ 2412 /* so must not be executed on windows */
2112 2413
2113 dup2 (fds [1], evpipe [1]); 2414 dup2 (fds [1], evpipe [1]);
2114 close (fds [1]); 2415 close (fds [1]);
2115 } 2416 }
2417
2418 fd_intern (evpipe [1]);
2116 2419
2117 ev_io_set (&pipe_w, evpipe [0] < 0 ? evpipe [1] : evpipe [0], EV_READ); 2420 ev_io_set (&pipe_w, evpipe [0] < 0 ? evpipe [1] : evpipe [0], EV_READ);
2118 ev_io_start (EV_A_ &pipe_w); 2421 ev_io_start (EV_A_ &pipe_w);
2119 ev_unref (EV_A); /* watcher should not keep loop alive */ 2422 ev_unref (EV_A); /* watcher should not keep loop alive */
2120 } 2423 }
2504{ 2807{
2505 return userdata; 2808 return userdata;
2506} 2809}
2507 2810
2508void 2811void
2509ev_set_invoke_pending_cb (EV_P_ void (*invoke_pending_cb)(EV_P)) EV_THROW 2812ev_set_invoke_pending_cb (EV_P_ ev_loop_callback invoke_pending_cb) EV_THROW
2510{ 2813{
2511 invoke_cb = invoke_pending_cb; 2814 invoke_cb = invoke_pending_cb;
2512} 2815}
2513 2816
2514void 2817void
2746#if EV_USE_INOTIFY 3049#if EV_USE_INOTIFY
2747 infy_fork (EV_A); 3050 infy_fork (EV_A);
2748#endif 3051#endif
2749 3052
2750#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE 3053#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE
2751 if (ev_is_active (&pipe_w)) 3054 if (ev_is_active (&pipe_w) && postfork != 2)
2752 { 3055 {
2753 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */ 3056 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */
2754 3057
2755 ev_ref (EV_A); 3058 ev_ref (EV_A);
2756 ev_io_stop (EV_A_ &pipe_w); 3059 ev_io_stop (EV_A_ &pipe_w);

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines