ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/libev/ev.c
(Generate patch)

Comparing libev/ev.c (file contents):
Revision 1.428 by root, Tue May 8 15:44:09 2012 UTC vs.
Revision 1.479 by root, Sun Dec 20 01:31:17 2015 UTC

1/* 1/*
2 * libev event processing core, watcher management 2 * libev event processing core, watcher management
3 * 3 *
4 * Copyright (c) 2007,2008,2009,2010,2011,2012 Marc Alexander Lehmann <libev@schmorp.de> 4 * Copyright (c) 2007,2008,2009,2010,2011,2012,2013 Marc Alexander Lehmann <libev@schmorp.de>
5 * All rights reserved. 5 * All rights reserved.
6 * 6 *
7 * Redistribution and use in source and binary forms, with or without modifica- 7 * Redistribution and use in source and binary forms, with or without modifica-
8 * tion, are permitted provided that the following conditions are met: 8 * tion, are permitted provided that the following conditions are met:
9 * 9 *
43# include EV_CONFIG_H 43# include EV_CONFIG_H
44# else 44# else
45# include "config.h" 45# include "config.h"
46# endif 46# endif
47 47
48#if HAVE_FLOOR 48# if HAVE_FLOOR
49# ifndef EV_USE_FLOOR 49# ifndef EV_USE_FLOOR
50# define EV_USE_FLOOR 1 50# define EV_USE_FLOOR 1
51# endif
51# endif 52# endif
52#endif
53 53
54# if HAVE_CLOCK_SYSCALL 54# if HAVE_CLOCK_SYSCALL
55# ifndef EV_USE_CLOCK_SYSCALL 55# ifndef EV_USE_CLOCK_SYSCALL
56# define EV_USE_CLOCK_SYSCALL 1 56# define EV_USE_CLOCK_SYSCALL 1
57# ifndef EV_USE_REALTIME 57# ifndef EV_USE_REALTIME
201# include <sys/wait.h> 201# include <sys/wait.h>
202# include <unistd.h> 202# include <unistd.h>
203#else 203#else
204# include <io.h> 204# include <io.h>
205# define WIN32_LEAN_AND_MEAN 205# define WIN32_LEAN_AND_MEAN
206# include <winsock2.h>
206# include <windows.h> 207# include <windows.h>
207# include <winsock2.h>
208# ifndef EV_SELECT_IS_WINSOCKET 208# ifndef EV_SELECT_IS_WINSOCKET
209# define EV_SELECT_IS_WINSOCKET 1 209# define EV_SELECT_IS_WINSOCKET 1
210# endif 210# endif
211# undef EV_AVOID_STDIO 211# undef EV_AVOID_STDIO
212#endif 212#endif
241#elif defined SIGARRAYSIZE 241#elif defined SIGARRAYSIZE
242# define EV_NSIG (SIGARRAYSIZE) /* Assume ary[SIGARRAYSIZE] */ 242# define EV_NSIG (SIGARRAYSIZE) /* Assume ary[SIGARRAYSIZE] */
243#elif defined _sys_nsig 243#elif defined _sys_nsig
244# define EV_NSIG (_sys_nsig) /* Solaris 2.5 */ 244# define EV_NSIG (_sys_nsig) /* Solaris 2.5 */
245#else 245#else
246# error "unable to find value for NSIG, please report" 246# define EV_NSIG (8 * sizeof (sigset_t) + 1)
247/* to make it compile regardless, just remove the above line, */
248/* but consider reporting it, too! :) */
249# define EV_NSIG 65
250#endif 247#endif
251 248
252#ifndef EV_USE_FLOOR 249#ifndef EV_USE_FLOOR
253# define EV_USE_FLOOR 0 250# define EV_USE_FLOOR 0
254#endif 251#endif
255 252
256#ifndef EV_USE_CLOCK_SYSCALL 253#ifndef EV_USE_CLOCK_SYSCALL
257# if __linux && __GLIBC__ >= 2 254# if __linux && __GLIBC__ == 2 && __GLIBC_MINOR__ < 17
258# define EV_USE_CLOCK_SYSCALL EV_FEATURE_OS 255# define EV_USE_CLOCK_SYSCALL EV_FEATURE_OS
259# else 256# else
260# define EV_USE_CLOCK_SYSCALL 0 257# define EV_USE_CLOCK_SYSCALL 0
258# endif
259#endif
260
261#if !(_POSIX_TIMERS > 0)
262# ifndef EV_USE_MONOTONIC
263# define EV_USE_MONOTONIC 0
264# endif
265# ifndef EV_USE_REALTIME
266# define EV_USE_REALTIME 0
261# endif 267# endif
262#endif 268#endif
263 269
264#ifndef EV_USE_MONOTONIC 270#ifndef EV_USE_MONOTONIC
265# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0 271# if defined _POSIX_MONOTONIC_CLOCK && _POSIX_MONOTONIC_CLOCK >= 0
355# define EV_USE_4HEAP EV_FEATURE_DATA 361# define EV_USE_4HEAP EV_FEATURE_DATA
356#endif 362#endif
357 363
358#ifndef EV_HEAP_CACHE_AT 364#ifndef EV_HEAP_CACHE_AT
359# define EV_HEAP_CACHE_AT EV_FEATURE_DATA 365# define EV_HEAP_CACHE_AT EV_FEATURE_DATA
366#endif
367
368#ifdef ANDROID
369/* supposedly, android doesn't typedef fd_mask */
370# undef EV_USE_SELECT
371# define EV_USE_SELECT 0
372/* supposedly, we need to include syscall.h, not sys/syscall.h, so just disable */
373# undef EV_USE_CLOCK_SYSCALL
374# define EV_USE_CLOCK_SYSCALL 0
375#endif
376
377/* aix's poll.h seems to cause lots of trouble */
378#ifdef _AIX
379/* AIX has a completely broken poll.h header */
380# undef EV_USE_POLL
381# define EV_USE_POLL 0
360#endif 382#endif
361 383
362/* on linux, we can use a (slow) syscall to avoid a dependency on pthread, */ 384/* on linux, we can use a (slow) syscall to avoid a dependency on pthread, */
363/* which makes programs even slower. might work on other unices, too. */ 385/* which makes programs even slower. might work on other unices, too. */
364#if EV_USE_CLOCK_SYSCALL 386#if EV_USE_CLOCK_SYSCALL
373# endif 395# endif
374#endif 396#endif
375 397
376/* this block fixes any misconfiguration where we know we run into trouble otherwise */ 398/* this block fixes any misconfiguration where we know we run into trouble otherwise */
377 399
378#ifdef _AIX
379/* AIX has a completely broken poll.h header */
380# undef EV_USE_POLL
381# define EV_USE_POLL 0
382#endif
383
384#ifndef CLOCK_MONOTONIC 400#ifndef CLOCK_MONOTONIC
385# undef EV_USE_MONOTONIC 401# undef EV_USE_MONOTONIC
386# define EV_USE_MONOTONIC 0 402# define EV_USE_MONOTONIC 0
387#endif 403#endif
388 404
409/* some very old inotify.h headers don't have IN_DONT_FOLLOW */ 425/* some very old inotify.h headers don't have IN_DONT_FOLLOW */
410# ifndef IN_DONT_FOLLOW 426# ifndef IN_DONT_FOLLOW
411# undef EV_USE_INOTIFY 427# undef EV_USE_INOTIFY
412# define EV_USE_INOTIFY 0 428# define EV_USE_INOTIFY 0
413# endif 429# endif
414#endif
415
416#if EV_SELECT_IS_WINSOCKET
417# include <winsock.h>
418#endif 430#endif
419 431
420#if EV_USE_EVENTFD 432#if EV_USE_EVENTFD
421/* our minimum requirement is glibc 2.7 which has the stub, but not the header */ 433/* our minimum requirement is glibc 2.7 which has the stub, but not the header */
422# include <stdint.h> 434# include <stdint.h>
479/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */ 491/* the following is ecb.h embedded into libev - use update_ev_c to update from an external copy */
480/* ECB.H BEGIN */ 492/* ECB.H BEGIN */
481/* 493/*
482 * libecb - http://software.schmorp.de/pkg/libecb 494 * libecb - http://software.schmorp.de/pkg/libecb
483 * 495 *
484 * Copyright (©) 2009-2012 Marc Alexander Lehmann <libecb@schmorp.de> 496 * Copyright (©) 2009-2015 Marc Alexander Lehmann <libecb@schmorp.de>
485 * Copyright (©) 2011 Emanuele Giaquinta 497 * Copyright (©) 2011 Emanuele Giaquinta
486 * All rights reserved. 498 * All rights reserved.
487 * 499 *
488 * Redistribution and use in source and binary forms, with or without modifica- 500 * Redistribution and use in source and binary forms, with or without modifica-
489 * tion, are permitted provided that the following conditions are met: 501 * tion, are permitted provided that the following conditions are met:
503 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; 515 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
504 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, 516 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
505 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH- 517 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH-
506 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED 518 * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
507 * OF THE POSSIBILITY OF SUCH DAMAGE. 519 * OF THE POSSIBILITY OF SUCH DAMAGE.
520 *
521 * Alternatively, the contents of this file may be used under the terms of
522 * the GNU General Public License ("GPL") version 2 or any later version,
523 * in which case the provisions of the GPL are applicable instead of
524 * the above. If you wish to allow the use of your version of this file
525 * only under the terms of the GPL and not to allow others to use your
526 * version of this file under the BSD license, indicate your decision
527 * by deleting the provisions above and replace them with the notice
528 * and other provisions required by the GPL. If you do not delete the
529 * provisions above, a recipient may use your version of this file under
530 * either the BSD or the GPL.
508 */ 531 */
509 532
510#ifndef ECB_H 533#ifndef ECB_H
511#define ECB_H 534#define ECB_H
535
536/* 16 bits major, 16 bits minor */
537#define ECB_VERSION 0x00010005
512 538
513#ifdef _WIN32 539#ifdef _WIN32
514 typedef signed char int8_t; 540 typedef signed char int8_t;
515 typedef unsigned char uint8_t; 541 typedef unsigned char uint8_t;
516 typedef signed short int16_t; 542 typedef signed short int16_t;
522 typedef unsigned long long uint64_t; 548 typedef unsigned long long uint64_t;
523 #else /* _MSC_VER || __BORLANDC__ */ 549 #else /* _MSC_VER || __BORLANDC__ */
524 typedef signed __int64 int64_t; 550 typedef signed __int64 int64_t;
525 typedef unsigned __int64 uint64_t; 551 typedef unsigned __int64 uint64_t;
526 #endif 552 #endif
553 #ifdef _WIN64
554 #define ECB_PTRSIZE 8
555 typedef uint64_t uintptr_t;
556 typedef int64_t intptr_t;
557 #else
558 #define ECB_PTRSIZE 4
559 typedef uint32_t uintptr_t;
560 typedef int32_t intptr_t;
561 #endif
527#else 562#else
528 #include <inttypes.h> 563 #include <inttypes.h>
564 #if (defined INTPTR_MAX ? INTPTR_MAX : ULONG_MAX) > 0xffffffffU
565 #define ECB_PTRSIZE 8
566 #else
567 #define ECB_PTRSIZE 4
568 #endif
569#endif
570
571#define ECB_GCC_AMD64 (__amd64 || __amd64__ || __x86_64 || __x86_64__)
572#define ECB_MSVC_AMD64 (_M_AMD64 || _M_X64)
573
574/* work around x32 idiocy by defining proper macros */
575#if ECB_GCC_AMD64 || ECB_MSVC_AMD64
576 #if _ILP32
577 #define ECB_AMD64_X32 1
578 #else
579 #define ECB_AMD64 1
580 #endif
529#endif 581#endif
530 582
531/* many compilers define _GNUC_ to some versions but then only implement 583/* many compilers define _GNUC_ to some versions but then only implement
532 * what their idiot authors think are the "more important" extensions, 584 * what their idiot authors think are the "more important" extensions,
533 * causing enormous grief in return for some better fake benchmark numbers. 585 * causing enormous grief in return for some better fake benchmark numbers.
534 * or so. 586 * or so.
535 * we try to detect these and simply assume they are not gcc - if they have 587 * we try to detect these and simply assume they are not gcc - if they have
536 * an issue with that they should have done it right in the first place. 588 * an issue with that they should have done it right in the first place.
537 */ 589 */
538#ifndef ECB_GCC_VERSION
539 #if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__ 590#if !defined __GNUC_MINOR__ || defined __INTEL_COMPILER || defined __SUNPRO_C || defined __SUNPRO_CC || defined __llvm__ || defined __clang__
540 #define ECB_GCC_VERSION(major,minor) 0 591 #define ECB_GCC_VERSION(major,minor) 0
541 #else 592#else
542 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor))) 593 #define ECB_GCC_VERSION(major,minor) (__GNUC__ > (major) || (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor)))
543 #endif 594#endif
595
596#define ECB_CLANG_VERSION(major,minor) (__clang_major__ > (major) || (__clang_major__ == (major) && __clang_minor__ >= (minor)))
597
598#if __clang__ && defined __has_builtin
599 #define ECB_CLANG_BUILTIN(x) __has_builtin (x)
600#else
601 #define ECB_CLANG_BUILTIN(x) 0
602#endif
603
604#if __clang__ && defined __has_extension
605 #define ECB_CLANG_EXTENSION(x) __has_extension (x)
606#else
607 #define ECB_CLANG_EXTENSION(x) 0
608#endif
609
610#define ECB_CPP (__cplusplus+0)
611#define ECB_CPP11 (__cplusplus >= 201103L)
612
613#if ECB_CPP
614 #define ECB_C 0
615 #define ECB_STDC_VERSION 0
616#else
617 #define ECB_C 1
618 #define ECB_STDC_VERSION __STDC_VERSION__
619#endif
620
621#define ECB_C99 (ECB_STDC_VERSION >= 199901L)
622#define ECB_C11 (ECB_STDC_VERSION >= 201112L)
623
624#if ECB_CPP
625 #define ECB_EXTERN_C extern "C"
626 #define ECB_EXTERN_C_BEG ECB_EXTERN_C {
627 #define ECB_EXTERN_C_END }
628#else
629 #define ECB_EXTERN_C extern
630 #define ECB_EXTERN_C_BEG
631 #define ECB_EXTERN_C_END
544#endif 632#endif
545 633
546/*****************************************************************************/ 634/*****************************************************************************/
547 635
548/* ECB_NO_THREADS - ecb is not used by multiple threads, ever */ 636/* ECB_NO_THREADS - ecb is not used by multiple threads, ever */
549/* ECB_NO_SMP - ecb might be used in multiple threads, but only on a single cpu */ 637/* ECB_NO_SMP - ecb might be used in multiple threads, but only on a single cpu */
550 638
551#if ECB_NO_THREADS 639#if ECB_NO_THREADS
552# define ECB_NO_SMP 1 640 #define ECB_NO_SMP 1
553#endif 641#endif
554 642
555#if ECB_NO_THREADS || ECB_NO_SMP 643#if ECB_NO_SMP
556 #define ECB_MEMORY_FENCE do { } while (0) 644 #define ECB_MEMORY_FENCE do { } while (0)
645#endif
646
647/* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/compiler_ref/compiler_builtins.html */
648#if __xlC__ && ECB_CPP
649 #include <builtins.h>
650#endif
651
652#if 1400 <= _MSC_VER
653 #include <intrin.h> /* fence functions _ReadBarrier, also bit search functions _BitScanReverse */
557#endif 654#endif
558 655
559#ifndef ECB_MEMORY_FENCE 656#ifndef ECB_MEMORY_FENCE
560 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110 657 #if ECB_GCC_VERSION(2,5) || defined __INTEL_COMPILER || (__llvm__ && __GNUC__) || __SUNPRO_C >= 0x5110 || __SUNPRO_CC >= 0x5110
561 #if __i386 || __i386__ 658 #if __i386 || __i386__
562 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory") 659 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("lock; orb $0, -1(%%esp)" : : : "memory")
563 #define ECB_MEMORY_FENCE_ACQUIRE ECB_MEMORY_FENCE /* non-lock xchg might be enough */ 660 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
564 #define ECB_MEMORY_FENCE_RELEASE do { } while (0) /* unlikely to change in future cpus */ 661 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
565 #elif __amd64 || __amd64__ || __x86_64 || __x86_64__ 662 #elif ECB_GCC_AMD64
566 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory") 663 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mfence" : : : "memory")
567 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("lfence" : : : "memory") 664 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("" : : : "memory")
568 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("sfence") /* play safe - not needed in any current cpu */ 665 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
569 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ 666 #elif __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__
570 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory") 667 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory")
668 #elif defined __ARM_ARCH_2__ \
669 || defined __ARM_ARCH_3__ || defined __ARM_ARCH_3M__ \
670 || defined __ARM_ARCH_4__ || defined __ARM_ARCH_4T__ \
671 || defined __ARM_ARCH_5__ || defined __ARM_ARCH_5E__ \
672 || defined __ARM_ARCH_5T__ || defined __ARM_ARCH_5TE__ \
673 || defined __ARM_ARCH_5TEJ__
674 /* should not need any, unless running old code on newer cpu - arm doesn't support that */
571 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \ 675 #elif defined __ARM_ARCH_6__ || defined __ARM_ARCH_6J__ \
572 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ 676 || defined __ARM_ARCH_6K__ || defined __ARM_ARCH_6ZK__ \
677 || defined __ARM_ARCH_6T2__
573 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory") 678 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mcr p15,0,%0,c7,c10,5" : : "r" (0) : "memory")
574 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \ 679 #elif defined __ARM_ARCH_7__ || defined __ARM_ARCH_7A__ \
575 || defined __ARM_ARCH_7M__ || defined __ARM_ARCH_7R__ 680 || defined __ARM_ARCH_7R__ || defined __ARM_ARCH_7M__
576 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory") 681 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb" : : : "memory")
577 #elif __sparc || __sparc__ 682 #elif __aarch64__
683 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("dmb ish" : : : "memory")
684 #elif (__sparc || __sparc__) && !(__sparc_v8__ || defined __sparcv8)
578 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad | " : : : "memory") 685 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad | #StoreStore | #StoreLoad" : : : "memory")
579 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory") 686 #define ECB_MEMORY_FENCE_ACQUIRE __asm__ __volatile__ ("membar #LoadStore | #LoadLoad" : : : "memory")
580 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore") 687 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("membar #LoadStore | #StoreStore")
581 #elif defined __s390__ || defined __s390x__ 688 #elif defined __s390__ || defined __s390x__
582 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory") 689 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("bcr 15,0" : : : "memory")
583 #elif defined __mips__ 690 #elif defined __mips__
691 /* GNU/Linux emulates sync on mips1 architectures, so we force its use */
692 /* anybody else who still uses mips1 is supposed to send in their version, with detection code. */
584 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("sync" : : : "memory") 693 #define ECB_MEMORY_FENCE __asm__ __volatile__ (".set mips2; sync; .set mips0" : : : "memory")
585 #elif defined __alpha__ 694 #elif defined __alpha__
586 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mb" : : : "memory") 695 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mb" : : : "memory")
696 #elif defined __hppa__
697 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
698 #define ECB_MEMORY_FENCE_RELEASE __asm__ __volatile__ ("")
699 #elif defined __ia64__
700 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("mf" : : : "memory")
701 #elif defined __m68k__
702 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
703 #elif defined __m88k__
704 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("tb1 0,%%r0,128" : : : "memory")
705 #elif defined __sh__
706 #define ECB_MEMORY_FENCE __asm__ __volatile__ ("" : : : "memory")
587 #endif 707 #endif
588 #endif 708 #endif
589#endif 709#endif
590 710
591#ifndef ECB_MEMORY_FENCE 711#ifndef ECB_MEMORY_FENCE
712 #if ECB_GCC_VERSION(4,7)
713 /* see comment below (stdatomic.h) about the C11 memory model. */
714 #define ECB_MEMORY_FENCE __atomic_thread_fence (__ATOMIC_SEQ_CST)
715 #define ECB_MEMORY_FENCE_ACQUIRE __atomic_thread_fence (__ATOMIC_ACQUIRE)
716 #define ECB_MEMORY_FENCE_RELEASE __atomic_thread_fence (__ATOMIC_RELEASE)
717
718 #elif ECB_CLANG_EXTENSION(c_atomic)
719 /* see comment below (stdatomic.h) about the C11 memory model. */
720 #define ECB_MEMORY_FENCE __c11_atomic_thread_fence (__ATOMIC_SEQ_CST)
721 #define ECB_MEMORY_FENCE_ACQUIRE __c11_atomic_thread_fence (__ATOMIC_ACQUIRE)
722 #define ECB_MEMORY_FENCE_RELEASE __c11_atomic_thread_fence (__ATOMIC_RELEASE)
723
592 #if ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__ 724 #elif ECB_GCC_VERSION(4,4) || defined __INTEL_COMPILER || defined __clang__
593 #define ECB_MEMORY_FENCE __sync_synchronize () 725 #define ECB_MEMORY_FENCE __sync_synchronize ()
594 /*#define ECB_MEMORY_FENCE_ACQUIRE ({ char dummy = 0; __sync_lock_test_and_set (&dummy, 1); }) */ 726 #elif _MSC_VER >= 1500 /* VC++ 2008 */
595 /*#define ECB_MEMORY_FENCE_RELEASE ({ char dummy = 1; __sync_lock_release (&dummy ); }) */ 727 /* apparently, microsoft broke all the memory barrier stuff in Visual Studio 2008... */
728 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier)
729 #define ECB_MEMORY_FENCE _ReadWriteBarrier (); MemoryBarrier()
730 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier (); MemoryBarrier() /* according to msdn, _ReadBarrier is not a load fence */
731 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier (); MemoryBarrier()
596 #elif _MSC_VER >= 1400 /* VC++ 2005 */ 732 #elif _MSC_VER >= 1400 /* VC++ 2005 */
597 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier) 733 #pragma intrinsic(_ReadBarrier,_WriteBarrier,_ReadWriteBarrier)
598 #define ECB_MEMORY_FENCE _ReadWriteBarrier () 734 #define ECB_MEMORY_FENCE _ReadWriteBarrier ()
599 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier () /* according to msdn, _ReadBarrier is not a load fence */ 735 #define ECB_MEMORY_FENCE_ACQUIRE _ReadWriteBarrier () /* according to msdn, _ReadBarrier is not a load fence */
600 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier () 736 #define ECB_MEMORY_FENCE_RELEASE _WriteBarrier ()
610 #define ECB_MEMORY_FENCE __sync () 746 #define ECB_MEMORY_FENCE __sync ()
611 #endif 747 #endif
612#endif 748#endif
613 749
614#ifndef ECB_MEMORY_FENCE 750#ifndef ECB_MEMORY_FENCE
751 #if ECB_C11 && !defined __STDC_NO_ATOMICS__
752 /* we assume that these memory fences work on all variables/all memory accesses, */
753 /* not just C11 atomics and atomic accesses */
754 #include <stdatomic.h>
755 /* Unfortunately, neither gcc 4.7 nor clang 3.1 generate any instructions for */
756 /* any fence other than seq_cst, which isn't very efficient for us. */
757 /* Why that is, we don't know - either the C11 memory model is quite useless */
758 /* for most usages, or gcc and clang have a bug */
759 /* I *currently* lean towards the latter, and inefficiently implement */
760 /* all three of ecb's fences as a seq_cst fence */
761 /* Update, gcc-4.8 generates mfence for all c++ fences, but nothing */
762 /* for all __atomic_thread_fence's except seq_cst */
763 #define ECB_MEMORY_FENCE atomic_thread_fence (memory_order_seq_cst)
764 #endif
765#endif
766
767#ifndef ECB_MEMORY_FENCE
615 #if !ECB_AVOID_PTHREADS 768 #if !ECB_AVOID_PTHREADS
616 /* 769 /*
617 * if you get undefined symbol references to pthread_mutex_lock, 770 * if you get undefined symbol references to pthread_mutex_lock,
618 * or failure to find pthread.h, then you should implement 771 * or failure to find pthread.h, then you should implement
619 * the ECB_MEMORY_FENCE operations for your cpu/compiler 772 * the ECB_MEMORY_FENCE operations for your cpu/compiler
637 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE 790 #define ECB_MEMORY_FENCE_RELEASE ECB_MEMORY_FENCE
638#endif 791#endif
639 792
640/*****************************************************************************/ 793/*****************************************************************************/
641 794
642#define ECB_C99 (__STDC_VERSION__ >= 199901L) 795#if ECB_CPP
643
644#if __cplusplus
645 #define ecb_inline static inline 796 #define ecb_inline static inline
646#elif ECB_GCC_VERSION(2,5) 797#elif ECB_GCC_VERSION(2,5)
647 #define ecb_inline static __inline__ 798 #define ecb_inline static __inline__
648#elif ECB_C99 799#elif ECB_C99
649 #define ecb_inline static inline 800 #define ecb_inline static inline
663 814
664#define ECB_CONCAT_(a, b) a ## b 815#define ECB_CONCAT_(a, b) a ## b
665#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b) 816#define ECB_CONCAT(a, b) ECB_CONCAT_(a, b)
666#define ECB_STRINGIFY_(a) # a 817#define ECB_STRINGIFY_(a) # a
667#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a) 818#define ECB_STRINGIFY(a) ECB_STRINGIFY_(a)
819#define ECB_STRINGIFY_EXPR(expr) ((expr), ECB_STRINGIFY_ (expr))
668 820
669#define ecb_function_ ecb_inline 821#define ecb_function_ ecb_inline
670 822
671#if ECB_GCC_VERSION(3,1) 823#if ECB_GCC_VERSION(3,1) || ECB_CLANG_VERSION(2,8)
672 #define ecb_attribute(attrlist) __attribute__(attrlist) 824 #define ecb_attribute(attrlist) __attribute__ (attrlist)
825#else
826 #define ecb_attribute(attrlist)
827#endif
828
829#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_constant_p)
673 #define ecb_is_constant(expr) __builtin_constant_p (expr) 830 #define ecb_is_constant(expr) __builtin_constant_p (expr)
831#else
832 /* possible C11 impl for integral types
833 typedef struct ecb_is_constant_struct ecb_is_constant_struct;
834 #define ecb_is_constant(expr) _Generic ((1 ? (struct ecb_is_constant_struct *)0 : (void *)((expr) - (expr)), ecb_is_constant_struct *: 0, default: 1)) */
835
836 #define ecb_is_constant(expr) 0
837#endif
838
839#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_expect)
674 #define ecb_expect(expr,value) __builtin_expect ((expr),(value)) 840 #define ecb_expect(expr,value) __builtin_expect ((expr),(value))
841#else
842 #define ecb_expect(expr,value) (expr)
843#endif
844
845#if ECB_GCC_VERSION(3,1) || ECB_CLANG_BUILTIN(__builtin_prefetch)
675 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality) 846 #define ecb_prefetch(addr,rw,locality) __builtin_prefetch (addr, rw, locality)
676#else 847#else
677 #define ecb_attribute(attrlist)
678 #define ecb_is_constant(expr) 0
679 #define ecb_expect(expr,value) (expr)
680 #define ecb_prefetch(addr,rw,locality) 848 #define ecb_prefetch(addr,rw,locality)
681#endif 849#endif
682 850
683/* no emulation for ecb_decltype */ 851/* no emulation for ecb_decltype */
684#if ECB_GCC_VERSION(4,5) 852#if ECB_CPP11
853 // older implementations might have problems with decltype(x)::type, work around it
854 template<class T> struct ecb_decltype_t { typedef T type; };
685 #define ecb_decltype(x) __decltype(x) 855 #define ecb_decltype(x) ecb_decltype_t<decltype (x)>::type
686#elif ECB_GCC_VERSION(3,0) 856#elif ECB_GCC_VERSION(3,0) || ECB_CLANG_VERSION(2,8)
687 #define ecb_decltype(x) __typeof(x) 857 #define ecb_decltype(x) __typeof__ (x)
688#endif 858#endif
689 859
860#if _MSC_VER >= 1300
861 #define ecb_deprecated __declspec (deprecated)
862#else
863 #define ecb_deprecated ecb_attribute ((__deprecated__))
864#endif
865
866#if _MSC_VER >= 1500
867 #define ecb_deprecated_message(msg) __declspec (deprecated (msg))
868#elif ECB_GCC_VERSION(4,5)
869 #define ecb_deprecated_message(msg) ecb_attribute ((__deprecated__ (msg))
870#else
871 #define ecb_deprecated_message(msg) ecb_deprecated
872#endif
873
874#if _MSC_VER >= 1400
875 #define ecb_noinline __declspec (noinline)
876#else
690#define ecb_noinline ecb_attribute ((__noinline__)) 877 #define ecb_noinline ecb_attribute ((__noinline__))
691#define ecb_noreturn ecb_attribute ((__noreturn__)) 878#endif
879
692#define ecb_unused ecb_attribute ((__unused__)) 880#define ecb_unused ecb_attribute ((__unused__))
693#define ecb_const ecb_attribute ((__const__)) 881#define ecb_const ecb_attribute ((__const__))
694#define ecb_pure ecb_attribute ((__pure__)) 882#define ecb_pure ecb_attribute ((__pure__))
883
884#if ECB_C11 || __IBMC_NORETURN
885 /* http://www-01.ibm.com/support/knowledgecenter/SSGH3R_13.1.0/com.ibm.xlcpp131.aix.doc/language_ref/noreturn.html */
886 #define ecb_noreturn _Noreturn
887#elif ECB_CPP11
888 #define ecb_noreturn [[noreturn]]
889#elif _MSC_VER >= 1200
890 /* http://msdn.microsoft.com/en-us/library/k6ktzx3s.aspx */
891 #define ecb_noreturn __declspec (noreturn)
892#else
893 #define ecb_noreturn ecb_attribute ((__noreturn__))
894#endif
695 895
696#if ECB_GCC_VERSION(4,3) 896#if ECB_GCC_VERSION(4,3)
697 #define ecb_artificial ecb_attribute ((__artificial__)) 897 #define ecb_artificial ecb_attribute ((__artificial__))
698 #define ecb_hot ecb_attribute ((__hot__)) 898 #define ecb_hot ecb_attribute ((__hot__))
699 #define ecb_cold ecb_attribute ((__cold__)) 899 #define ecb_cold ecb_attribute ((__cold__))
711/* for compatibility to the rest of the world */ 911/* for compatibility to the rest of the world */
712#define ecb_likely(expr) ecb_expect_true (expr) 912#define ecb_likely(expr) ecb_expect_true (expr)
713#define ecb_unlikely(expr) ecb_expect_false (expr) 913#define ecb_unlikely(expr) ecb_expect_false (expr)
714 914
715/* count trailing zero bits and count # of one bits */ 915/* count trailing zero bits and count # of one bits */
716#if ECB_GCC_VERSION(3,4) 916#if ECB_GCC_VERSION(3,4) \
917 || (ECB_CLANG_BUILTIN(__builtin_clz) && ECB_CLANG_BUILTIN(__builtin_clzll) \
918 && ECB_CLANG_BUILTIN(__builtin_ctz) && ECB_CLANG_BUILTIN(__builtin_ctzll) \
919 && ECB_CLANG_BUILTIN(__builtin_popcount))
717 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */ 920 /* we assume int == 32 bit, long == 32 or 64 bit and long long == 64 bit */
718 #define ecb_ld32(x) (__builtin_clz (x) ^ 31) 921 #define ecb_ld32(x) (__builtin_clz (x) ^ 31)
719 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63) 922 #define ecb_ld64(x) (__builtin_clzll (x) ^ 63)
720 #define ecb_ctz32(x) __builtin_ctz (x) 923 #define ecb_ctz32(x) __builtin_ctz (x)
721 #define ecb_ctz64(x) __builtin_ctzll (x) 924 #define ecb_ctz64(x) __builtin_ctzll (x)
722 #define ecb_popcount32(x) __builtin_popcount (x) 925 #define ecb_popcount32(x) __builtin_popcount (x)
723 /* no popcountll */ 926 /* no popcountll */
724#else 927#else
725 ecb_function_ int ecb_ctz32 (uint32_t x) ecb_const; 928 ecb_function_ ecb_const int ecb_ctz32 (uint32_t x);
726 ecb_function_ int 929 ecb_function_ ecb_const int
727 ecb_ctz32 (uint32_t x) 930 ecb_ctz32 (uint32_t x)
728 { 931 {
932#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
933 unsigned long r;
934 _BitScanForward (&r, x);
935 return (int)r;
936#else
729 int r = 0; 937 int r = 0;
730 938
731 x &= ~x + 1; /* this isolates the lowest bit */ 939 x &= ~x + 1; /* this isolates the lowest bit */
732 940
733#if ECB_branchless_on_i386 941#if ECB_branchless_on_i386
743 if (x & 0xff00ff00) r += 8; 951 if (x & 0xff00ff00) r += 8;
744 if (x & 0xffff0000) r += 16; 952 if (x & 0xffff0000) r += 16;
745#endif 953#endif
746 954
747 return r; 955 return r;
956#endif
748 } 957 }
749 958
750 ecb_function_ int ecb_ctz64 (uint64_t x) ecb_const; 959 ecb_function_ ecb_const int ecb_ctz64 (uint64_t x);
751 ecb_function_ int 960 ecb_function_ ecb_const int
752 ecb_ctz64 (uint64_t x) 961 ecb_ctz64 (uint64_t x)
753 { 962 {
963#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
964 unsigned long r;
965 _BitScanForward64 (&r, x);
966 return (int)r;
967#else
754 int shift = x & 0xffffffffU ? 0 : 32; 968 int shift = x & 0xffffffff ? 0 : 32;
755 return ecb_ctz32 (x >> shift) + shift; 969 return ecb_ctz32 (x >> shift) + shift;
970#endif
756 } 971 }
757 972
758 ecb_function_ int ecb_popcount32 (uint32_t x) ecb_const; 973 ecb_function_ ecb_const int ecb_popcount32 (uint32_t x);
759 ecb_function_ int 974 ecb_function_ ecb_const int
760 ecb_popcount32 (uint32_t x) 975 ecb_popcount32 (uint32_t x)
761 { 976 {
762 x -= (x >> 1) & 0x55555555; 977 x -= (x >> 1) & 0x55555555;
763 x = ((x >> 2) & 0x33333333) + (x & 0x33333333); 978 x = ((x >> 2) & 0x33333333) + (x & 0x33333333);
764 x = ((x >> 4) + x) & 0x0f0f0f0f; 979 x = ((x >> 4) + x) & 0x0f0f0f0f;
765 x *= 0x01010101; 980 x *= 0x01010101;
766 981
767 return x >> 24; 982 return x >> 24;
768 } 983 }
769 984
770 ecb_function_ int ecb_ld32 (uint32_t x) ecb_const; 985 ecb_function_ ecb_const int ecb_ld32 (uint32_t x);
771 ecb_function_ int ecb_ld32 (uint32_t x) 986 ecb_function_ ecb_const int ecb_ld32 (uint32_t x)
772 { 987 {
988#if 1400 <= _MSC_VER && (_M_IX86 || _M_X64 || _M_IA64 || _M_ARM)
989 unsigned long r;
990 _BitScanReverse (&r, x);
991 return (int)r;
992#else
773 int r = 0; 993 int r = 0;
774 994
775 if (x >> 16) { x >>= 16; r += 16; } 995 if (x >> 16) { x >>= 16; r += 16; }
776 if (x >> 8) { x >>= 8; r += 8; } 996 if (x >> 8) { x >>= 8; r += 8; }
777 if (x >> 4) { x >>= 4; r += 4; } 997 if (x >> 4) { x >>= 4; r += 4; }
778 if (x >> 2) { x >>= 2; r += 2; } 998 if (x >> 2) { x >>= 2; r += 2; }
779 if (x >> 1) { r += 1; } 999 if (x >> 1) { r += 1; }
780 1000
781 return r; 1001 return r;
1002#endif
782 } 1003 }
783 1004
784 ecb_function_ int ecb_ld64 (uint64_t x) ecb_const; 1005 ecb_function_ ecb_const int ecb_ld64 (uint64_t x);
785 ecb_function_ int ecb_ld64 (uint64_t x) 1006 ecb_function_ ecb_const int ecb_ld64 (uint64_t x)
786 { 1007 {
1008#if 1400 <= _MSC_VER && (_M_X64 || _M_IA64 || _M_ARM)
1009 unsigned long r;
1010 _BitScanReverse64 (&r, x);
1011 return (int)r;
1012#else
787 int r = 0; 1013 int r = 0;
788 1014
789 if (x >> 32) { x >>= 32; r += 32; } 1015 if (x >> 32) { x >>= 32; r += 32; }
790 1016
791 return r + ecb_ld32 (x); 1017 return r + ecb_ld32 (x);
1018#endif
792 } 1019 }
793#endif 1020#endif
794 1021
1022ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x);
1023ecb_function_ ecb_const ecb_bool ecb_is_pot32 (uint32_t x) { return !(x & (x - 1)); }
1024ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x);
1025ecb_function_ ecb_const ecb_bool ecb_is_pot64 (uint64_t x) { return !(x & (x - 1)); }
1026
795ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) ecb_const; 1027ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x);
796ecb_function_ uint8_t ecb_bitrev8 (uint8_t x) 1028ecb_function_ ecb_const uint8_t ecb_bitrev8 (uint8_t x)
797{ 1029{
798 return ( (x * 0x0802U & 0x22110U) 1030 return ( (x * 0x0802U & 0x22110U)
799 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16; 1031 | (x * 0x8020U & 0x88440U)) * 0x10101U >> 16;
800} 1032}
801 1033
802ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) ecb_const; 1034ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x);
803ecb_function_ uint16_t ecb_bitrev16 (uint16_t x) 1035ecb_function_ ecb_const uint16_t ecb_bitrev16 (uint16_t x)
804{ 1036{
805 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1); 1037 x = ((x >> 1) & 0x5555) | ((x & 0x5555) << 1);
806 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2); 1038 x = ((x >> 2) & 0x3333) | ((x & 0x3333) << 2);
807 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4); 1039 x = ((x >> 4) & 0x0f0f) | ((x & 0x0f0f) << 4);
808 x = ( x >> 8 ) | ( x << 8); 1040 x = ( x >> 8 ) | ( x << 8);
809 1041
810 return x; 1042 return x;
811} 1043}
812 1044
813ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) ecb_const; 1045ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x);
814ecb_function_ uint32_t ecb_bitrev32 (uint32_t x) 1046ecb_function_ ecb_const uint32_t ecb_bitrev32 (uint32_t x)
815{ 1047{
816 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1); 1048 x = ((x >> 1) & 0x55555555) | ((x & 0x55555555) << 1);
817 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2); 1049 x = ((x >> 2) & 0x33333333) | ((x & 0x33333333) << 2);
818 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4); 1050 x = ((x >> 4) & 0x0f0f0f0f) | ((x & 0x0f0f0f0f) << 4);
819 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8); 1051 x = ((x >> 8) & 0x00ff00ff) | ((x & 0x00ff00ff) << 8);
822 return x; 1054 return x;
823} 1055}
824 1056
825/* popcount64 is only available on 64 bit cpus as gcc builtin */ 1057/* popcount64 is only available on 64 bit cpus as gcc builtin */
826/* so for this version we are lazy */ 1058/* so for this version we are lazy */
827ecb_function_ int ecb_popcount64 (uint64_t x) ecb_const; 1059ecb_function_ ecb_const int ecb_popcount64 (uint64_t x);
828ecb_function_ int 1060ecb_function_ ecb_const int
829ecb_popcount64 (uint64_t x) 1061ecb_popcount64 (uint64_t x)
830{ 1062{
831 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32); 1063 return ecb_popcount32 (x) + ecb_popcount32 (x >> 32);
832} 1064}
833 1065
834ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) ecb_const; 1066ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count);
835ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) ecb_const; 1067ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count);
836ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) ecb_const; 1068ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count);
837ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) ecb_const; 1069ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count);
838ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) ecb_const; 1070ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count);
839ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) ecb_const; 1071ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count);
840ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) ecb_const; 1072ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count);
841ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) ecb_const; 1073ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count);
842 1074
843ecb_inline uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); } 1075ecb_inline ecb_const uint8_t ecb_rotl8 (uint8_t x, unsigned int count) { return (x >> ( 8 - count)) | (x << count); }
844ecb_inline uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); } 1076ecb_inline ecb_const uint8_t ecb_rotr8 (uint8_t x, unsigned int count) { return (x << ( 8 - count)) | (x >> count); }
845ecb_inline uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); } 1077ecb_inline ecb_const uint16_t ecb_rotl16 (uint16_t x, unsigned int count) { return (x >> (16 - count)) | (x << count); }
846ecb_inline uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); } 1078ecb_inline ecb_const uint16_t ecb_rotr16 (uint16_t x, unsigned int count) { return (x << (16 - count)) | (x >> count); }
847ecb_inline uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); } 1079ecb_inline ecb_const uint32_t ecb_rotl32 (uint32_t x, unsigned int count) { return (x >> (32 - count)) | (x << count); }
848ecb_inline uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); } 1080ecb_inline ecb_const uint32_t ecb_rotr32 (uint32_t x, unsigned int count) { return (x << (32 - count)) | (x >> count); }
849ecb_inline uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); } 1081ecb_inline ecb_const uint64_t ecb_rotl64 (uint64_t x, unsigned int count) { return (x >> (64 - count)) | (x << count); }
850ecb_inline uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); } 1082ecb_inline ecb_const uint64_t ecb_rotr64 (uint64_t x, unsigned int count) { return (x << (64 - count)) | (x >> count); }
851 1083
852#if ECB_GCC_VERSION(4,3) 1084#if ECB_GCC_VERSION(4,3) || (ECB_CLANG_BUILTIN(__builtin_bswap32) && ECB_CLANG_BUILTIN(__builtin_bswap64))
1085 #if ECB_GCC_VERSION(4,8) || ECB_CLANG_BUILTIN(__builtin_bswap16)
1086 #define ecb_bswap16(x) __builtin_bswap16 (x)
1087 #else
853 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16) 1088 #define ecb_bswap16(x) (__builtin_bswap32 (x) >> 16)
1089 #endif
854 #define ecb_bswap32(x) __builtin_bswap32 (x) 1090 #define ecb_bswap32(x) __builtin_bswap32 (x)
855 #define ecb_bswap64(x) __builtin_bswap64 (x) 1091 #define ecb_bswap64(x) __builtin_bswap64 (x)
1092#elif _MSC_VER
1093 #include <stdlib.h>
1094 #define ecb_bswap16(x) ((uint16_t)_byteswap_ushort ((uint16_t)(x)))
1095 #define ecb_bswap32(x) ((uint32_t)_byteswap_ulong ((uint32_t)(x)))
1096 #define ecb_bswap64(x) ((uint64_t)_byteswap_uint64 ((uint64_t)(x)))
856#else 1097#else
857 ecb_function_ uint16_t ecb_bswap16 (uint16_t x) ecb_const; 1098 ecb_function_ ecb_const uint16_t ecb_bswap16 (uint16_t x);
858 ecb_function_ uint16_t 1099 ecb_function_ ecb_const uint16_t
859 ecb_bswap16 (uint16_t x) 1100 ecb_bswap16 (uint16_t x)
860 { 1101 {
861 return ecb_rotl16 (x, 8); 1102 return ecb_rotl16 (x, 8);
862 } 1103 }
863 1104
864 ecb_function_ uint32_t ecb_bswap32 (uint32_t x) ecb_const; 1105 ecb_function_ ecb_const uint32_t ecb_bswap32 (uint32_t x);
865 ecb_function_ uint32_t 1106 ecb_function_ ecb_const uint32_t
866 ecb_bswap32 (uint32_t x) 1107 ecb_bswap32 (uint32_t x)
867 { 1108 {
868 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16); 1109 return (((uint32_t)ecb_bswap16 (x)) << 16) | ecb_bswap16 (x >> 16);
869 } 1110 }
870 1111
871 ecb_function_ uint64_t ecb_bswap64 (uint64_t x) ecb_const; 1112 ecb_function_ ecb_const uint64_t ecb_bswap64 (uint64_t x);
872 ecb_function_ uint64_t 1113 ecb_function_ ecb_const uint64_t
873 ecb_bswap64 (uint64_t x) 1114 ecb_bswap64 (uint64_t x)
874 { 1115 {
875 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32); 1116 return (((uint64_t)ecb_bswap32 (x)) << 32) | ecb_bswap32 (x >> 32);
876 } 1117 }
877#endif 1118#endif
878 1119
879#if ECB_GCC_VERSION(4,5) 1120#if ECB_GCC_VERSION(4,5) || ECB_CLANG_BUILTIN(__builtin_unreachable)
880 #define ecb_unreachable() __builtin_unreachable () 1121 #define ecb_unreachable() __builtin_unreachable ()
881#else 1122#else
882 /* this seems to work fine, but gcc always emits a warning for it :/ */ 1123 /* this seems to work fine, but gcc always emits a warning for it :/ */
883 ecb_inline void ecb_unreachable (void) ecb_noreturn; 1124 ecb_inline ecb_noreturn void ecb_unreachable (void);
884 ecb_inline void ecb_unreachable (void) { } 1125 ecb_inline ecb_noreturn void ecb_unreachable (void) { }
885#endif 1126#endif
886 1127
887/* try to tell the compiler that some condition is definitely true */ 1128/* try to tell the compiler that some condition is definitely true */
888#define ecb_assume(cond) do { if (!(cond)) ecb_unreachable (); } while (0) 1129#define ecb_assume(cond) if (!(cond)) ecb_unreachable (); else 0
889 1130
890ecb_inline unsigned char ecb_byteorder_helper (void) ecb_const; 1131ecb_inline ecb_const uint32_t ecb_byteorder_helper (void);
891ecb_inline unsigned char 1132ecb_inline ecb_const uint32_t
892ecb_byteorder_helper (void) 1133ecb_byteorder_helper (void)
893{ 1134{
894 const uint32_t u = 0x11223344; 1135 /* the union code still generates code under pressure in gcc, */
895 return *(unsigned char *)&u; 1136 /* but less than using pointers, and always seems to */
1137 /* successfully return a constant. */
1138 /* the reason why we have this horrible preprocessor mess */
1139 /* is to avoid it in all cases, at least on common architectures */
1140 /* or when using a recent enough gcc version (>= 4.6) */
1141#if (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__) \
1142 || ((__i386 || __i386__ || _M_IX86 || ECB_GCC_AMD64 || ECB_MSVC_AMD64) && !__VOS__)
1143 #define ECB_LITTLE_ENDIAN 1
1144 return 0x44332211;
1145#elif (defined __BYTE_ORDER__ && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__) \
1146 || ((__AARCH64EB__ || __MIPSEB__ || __ARMEB__) && !__VOS__)
1147 #define ECB_BIG_ENDIAN 1
1148 return 0x11223344;
1149#else
1150 union
1151 {
1152 uint8_t c[4];
1153 uint32_t u;
1154 } u = { 0x11, 0x22, 0x33, 0x44 };
1155 return u.u;
1156#endif
896} 1157}
897 1158
898ecb_inline ecb_bool ecb_big_endian (void) ecb_const; 1159ecb_inline ecb_const ecb_bool ecb_big_endian (void);
899ecb_inline ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11; } 1160ecb_inline ecb_const ecb_bool ecb_big_endian (void) { return ecb_byteorder_helper () == 0x11223344; }
900ecb_inline ecb_bool ecb_little_endian (void) ecb_const; 1161ecb_inline ecb_const ecb_bool ecb_little_endian (void);
901ecb_inline ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44; } 1162ecb_inline ecb_const ecb_bool ecb_little_endian (void) { return ecb_byteorder_helper () == 0x44332211; }
902 1163
903#if ECB_GCC_VERSION(3,0) || ECB_C99 1164#if ECB_GCC_VERSION(3,0) || ECB_C99
904 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0)) 1165 #define ecb_mod(m,n) ((m) % (n) + ((m) % (n) < 0 ? (n) : 0))
905#else 1166#else
906 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n))) 1167 #define ecb_mod(m,n) ((m) < 0 ? ((n) - 1 - ((-1 - (m)) % (n))) : ((m) % (n)))
907#endif 1168#endif
908 1169
909#if __cplusplus 1170#if ECB_CPP
910 template<typename T> 1171 template<typename T>
911 static inline T ecb_div_rd (T val, T div) 1172 static inline T ecb_div_rd (T val, T div)
912 { 1173 {
913 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div; 1174 return val < 0 ? - ((-val + div - 1) / div) : (val ) / div;
914 } 1175 }
931 } 1192 }
932#else 1193#else
933 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0])) 1194 #define ecb_array_length(name) (sizeof (name) / sizeof (name [0]))
934#endif 1195#endif
935 1196
1197ecb_function_ ecb_const uint32_t ecb_binary16_to_binary32 (uint32_t x);
1198ecb_function_ ecb_const uint32_t
1199ecb_binary16_to_binary32 (uint32_t x)
1200{
1201 unsigned int s = (x & 0x8000) << (31 - 15);
1202 int e = (x >> 10) & 0x001f;
1203 unsigned int m = x & 0x03ff;
1204
1205 if (ecb_expect_false (e == 31))
1206 /* infinity or NaN */
1207 e = 255 - (127 - 15);
1208 else if (ecb_expect_false (!e))
1209 {
1210 if (ecb_expect_true (!m))
1211 /* zero, handled by code below by forcing e to 0 */
1212 e = 0 - (127 - 15);
1213 else
1214 {
1215 /* subnormal, renormalise */
1216 unsigned int s = 10 - ecb_ld32 (m);
1217
1218 m = (m << s) & 0x3ff; /* mask implicit bit */
1219 e -= s - 1;
1220 }
1221 }
1222
1223 /* e and m now are normalised, or zero, (or inf or nan) */
1224 e += 127 - 15;
1225
1226 return s | (e << 23) | (m << (23 - 10));
1227}
1228
1229ecb_function_ ecb_const uint16_t ecb_binary32_to_binary16 (uint32_t x);
1230ecb_function_ ecb_const uint16_t
1231ecb_binary32_to_binary16 (uint32_t x)
1232{
1233 unsigned int s = (x >> 16) & 0x00008000; /* sign bit, the easy part */
1234 unsigned int e = ((x >> 23) & 0x000000ff) - (127 - 15); /* the desired exponent */
1235 unsigned int m = x & 0x007fffff;
1236
1237 x &= 0x7fffffff;
1238
1239 /* if it's within range of binary16 normals, use fast path */
1240 if (ecb_expect_true (0x38800000 <= x && x <= 0x477fefff))
1241 {
1242 /* mantissa round-to-even */
1243 m += 0x00000fff + ((m >> (23 - 10)) & 1);
1244
1245 /* handle overflow */
1246 if (ecb_expect_false (m >= 0x00800000))
1247 {
1248 m >>= 1;
1249 e += 1;
1250 }
1251
1252 return s | (e << 10) | (m >> (23 - 10));
1253 }
1254
1255 /* handle large numbers and infinity */
1256 if (ecb_expect_true (0x477fefff < x && x <= 0x7f800000))
1257 return s | 0x7c00;
1258
1259 /* handle zero, subnormals and small numbers */
1260 if (ecb_expect_true (x < 0x38800000))
1261 {
1262 /* zero */
1263 if (ecb_expect_true (!x))
1264 return s;
1265
1266 /* handle subnormals */
1267
1268 /* too small, will be zero */
1269 if (e < (14 - 24)) /* might not be sharp, but is good enough */
1270 return s;
1271
1272 m |= 0x00800000; /* make implicit bit explicit */
1273
1274 /* very tricky - we need to round to the nearest e (+10) bit value */
1275 {
1276 unsigned int bits = 14 - e;
1277 unsigned int half = (1 << (bits - 1)) - 1;
1278 unsigned int even = (m >> bits) & 1;
1279
1280 /* if this overflows, we will end up with a normalised number */
1281 m = (m + half + even) >> bits;
1282 }
1283
1284 return s | m;
1285 }
1286
1287 /* handle NaNs, preserve leftmost nan bits, but make sure we don't turn them into infinities */
1288 m >>= 13;
1289
1290 return s | 0x7c00 | m | !m;
1291}
1292
1293/*******************************************************************************/
1294/* floating point stuff, can be disabled by defining ECB_NO_LIBM */
1295
1296/* basically, everything uses "ieee pure-endian" floating point numbers */
1297/* the only noteworthy exception is ancient armle, which uses order 43218765 */
1298#if 0 \
1299 || __i386 || __i386__ \
1300 || ECB_GCC_AMD64 \
1301 || __powerpc__ || __ppc__ || __powerpc64__ || __ppc64__ \
1302 || defined __s390__ || defined __s390x__ \
1303 || defined __mips__ \
1304 || defined __alpha__ \
1305 || defined __hppa__ \
1306 || defined __ia64__ \
1307 || defined __m68k__ \
1308 || defined __m88k__ \
1309 || defined __sh__ \
1310 || defined _M_IX86 || defined ECB_MSVC_AMD64 || defined _M_IA64 \
1311 || (defined __arm__ && (defined __ARM_EABI__ || defined __EABI__ || defined __VFP_FP__ || defined _WIN32_WCE || defined __ANDROID__)) \
1312 || defined __aarch64__
1313 #define ECB_STDFP 1
1314 #include <string.h> /* for memcpy */
1315#else
1316 #define ECB_STDFP 0
1317#endif
1318
1319#ifndef ECB_NO_LIBM
1320
1321 #include <math.h> /* for frexp*, ldexp*, INFINITY, NAN */
1322
1323 /* only the oldest of old doesn't have this one. solaris. */
1324 #ifdef INFINITY
1325 #define ECB_INFINITY INFINITY
1326 #else
1327 #define ECB_INFINITY HUGE_VAL
1328 #endif
1329
1330 #ifdef NAN
1331 #define ECB_NAN NAN
1332 #else
1333 #define ECB_NAN ECB_INFINITY
1334 #endif
1335
1336 #if ECB_C99 || _XOPEN_VERSION >= 600 || _POSIX_VERSION >= 200112L
1337 #define ecb_ldexpf(x,e) ldexpf ((x), (e))
1338 #define ecb_frexpf(x,e) frexpf ((x), (e))
1339 #else
1340 #define ecb_ldexpf(x,e) (float) ldexp ((double) (x), (e))
1341 #define ecb_frexpf(x,e) (float) frexp ((double) (x), (e))
1342 #endif
1343
1344 /* convert a float to ieee single/binary32 */
1345 ecb_function_ ecb_const uint32_t ecb_float_to_binary32 (float x);
1346 ecb_function_ ecb_const uint32_t
1347 ecb_float_to_binary32 (float x)
1348 {
1349 uint32_t r;
1350
1351 #if ECB_STDFP
1352 memcpy (&r, &x, 4);
1353 #else
1354 /* slow emulation, works for anything but -0 */
1355 uint32_t m;
1356 int e;
1357
1358 if (x == 0e0f ) return 0x00000000U;
1359 if (x > +3.40282346638528860e+38f) return 0x7f800000U;
1360 if (x < -3.40282346638528860e+38f) return 0xff800000U;
1361 if (x != x ) return 0x7fbfffffU;
1362
1363 m = ecb_frexpf (x, &e) * 0x1000000U;
1364
1365 r = m & 0x80000000U;
1366
1367 if (r)
1368 m = -m;
1369
1370 if (e <= -126)
1371 {
1372 m &= 0xffffffU;
1373 m >>= (-125 - e);
1374 e = -126;
1375 }
1376
1377 r |= (e + 126) << 23;
1378 r |= m & 0x7fffffU;
1379 #endif
1380
1381 return r;
1382 }
1383
1384 /* converts an ieee single/binary32 to a float */
1385 ecb_function_ ecb_const float ecb_binary32_to_float (uint32_t x);
1386 ecb_function_ ecb_const float
1387 ecb_binary32_to_float (uint32_t x)
1388 {
1389 float r;
1390
1391 #if ECB_STDFP
1392 memcpy (&r, &x, 4);
1393 #else
1394 /* emulation, only works for normals and subnormals and +0 */
1395 int neg = x >> 31;
1396 int e = (x >> 23) & 0xffU;
1397
1398 x &= 0x7fffffU;
1399
1400 if (e)
1401 x |= 0x800000U;
1402 else
1403 e = 1;
1404
1405 /* we distrust ldexpf a bit and do the 2**-24 scaling by an extra multiply */
1406 r = ecb_ldexpf (x * (0.5f / 0x800000U), e - 126);
1407
1408 r = neg ? -r : r;
1409 #endif
1410
1411 return r;
1412 }
1413
1414 /* convert a double to ieee double/binary64 */
1415 ecb_function_ ecb_const uint64_t ecb_double_to_binary64 (double x);
1416 ecb_function_ ecb_const uint64_t
1417 ecb_double_to_binary64 (double x)
1418 {
1419 uint64_t r;
1420
1421 #if ECB_STDFP
1422 memcpy (&r, &x, 8);
1423 #else
1424 /* slow emulation, works for anything but -0 */
1425 uint64_t m;
1426 int e;
1427
1428 if (x == 0e0 ) return 0x0000000000000000U;
1429 if (x > +1.79769313486231470e+308) return 0x7ff0000000000000U;
1430 if (x < -1.79769313486231470e+308) return 0xfff0000000000000U;
1431 if (x != x ) return 0X7ff7ffffffffffffU;
1432
1433 m = frexp (x, &e) * 0x20000000000000U;
1434
1435 r = m & 0x8000000000000000;;
1436
1437 if (r)
1438 m = -m;
1439
1440 if (e <= -1022)
1441 {
1442 m &= 0x1fffffffffffffU;
1443 m >>= (-1021 - e);
1444 e = -1022;
1445 }
1446
1447 r |= ((uint64_t)(e + 1022)) << 52;
1448 r |= m & 0xfffffffffffffU;
1449 #endif
1450
1451 return r;
1452 }
1453
1454 /* converts an ieee double/binary64 to a double */
1455 ecb_function_ ecb_const double ecb_binary64_to_double (uint64_t x);
1456 ecb_function_ ecb_const double
1457 ecb_binary64_to_double (uint64_t x)
1458 {
1459 double r;
1460
1461 #if ECB_STDFP
1462 memcpy (&r, &x, 8);
1463 #else
1464 /* emulation, only works for normals and subnormals and +0 */
1465 int neg = x >> 63;
1466 int e = (x >> 52) & 0x7ffU;
1467
1468 x &= 0xfffffffffffffU;
1469
1470 if (e)
1471 x |= 0x10000000000000U;
1472 else
1473 e = 1;
1474
1475 /* we distrust ldexp a bit and do the 2**-53 scaling by an extra multiply */
1476 r = ldexp (x * (0.5 / 0x10000000000000U), e - 1022);
1477
1478 r = neg ? -r : r;
1479 #endif
1480
1481 return r;
1482 }
1483
1484 /* convert a float to ieee half/binary16 */
1485 ecb_function_ ecb_const uint16_t ecb_float_to_binary16 (float x);
1486 ecb_function_ ecb_const uint16_t
1487 ecb_float_to_binary16 (float x)
1488 {
1489 return ecb_binary32_to_binary16 (ecb_float_to_binary32 (x));
1490 }
1491
1492 /* convert an ieee half/binary16 to float */
1493 ecb_function_ ecb_const float ecb_binary16_to_float (uint16_t x);
1494 ecb_function_ ecb_const float
1495 ecb_binary16_to_float (uint16_t x)
1496 {
1497 return ecb_binary32_to_float (ecb_binary16_to_binary32 (x));
1498 }
1499
1500#endif
1501
936#endif 1502#endif
937 1503
938/* ECB.H END */ 1504/* ECB.H END */
939 1505
940#if ECB_MEMORY_FENCE_NEEDS_PTHREADS 1506#if ECB_MEMORY_FENCE_NEEDS_PTHREADS
1109#endif 1675#endif
1110 1676
1111static void (*syserr_cb)(const char *msg) EV_THROW; 1677static void (*syserr_cb)(const char *msg) EV_THROW;
1112 1678
1113void ecb_cold 1679void ecb_cold
1114ev_set_syserr_cb (void (*cb)(const char *msg)) EV_THROW 1680ev_set_syserr_cb (void (*cb)(const char *msg) EV_THROW) EV_THROW
1115{ 1681{
1116 syserr_cb = cb; 1682 syserr_cb = cb;
1117} 1683}
1118 1684
1119static void noinline ecb_cold 1685static void noinline ecb_cold
1137 abort (); 1703 abort ();
1138 } 1704 }
1139} 1705}
1140 1706
1141static void * 1707static void *
1142ev_realloc_emul (void *ptr, long size) 1708ev_realloc_emul (void *ptr, long size) EV_THROW
1143{ 1709{
1144#if __GLIBC__
1145 return realloc (ptr, size);
1146#else
1147 /* some systems, notably openbsd and darwin, fail to properly 1710 /* some systems, notably openbsd and darwin, fail to properly
1148 * implement realloc (x, 0) (as required by both ansi c-89 and 1711 * implement realloc (x, 0) (as required by both ansi c-89 and
1149 * the single unix specification, so work around them here. 1712 * the single unix specification, so work around them here.
1713 * recently, also (at least) fedora and debian started breaking it,
1714 * despite documenting it otherwise.
1150 */ 1715 */
1151 1716
1152 if (size) 1717 if (size)
1153 return realloc (ptr, size); 1718 return realloc (ptr, size);
1154 1719
1155 free (ptr); 1720 free (ptr);
1156 return 0; 1721 return 0;
1157#endif
1158} 1722}
1159 1723
1160static void *(*alloc)(void *ptr, long size) EV_THROW = ev_realloc_emul; 1724static void *(*alloc)(void *ptr, long size) EV_THROW = ev_realloc_emul;
1161 1725
1162void ecb_cold 1726void ecb_cold
1163ev_set_allocator (void *(*cb)(void *ptr, long size)) EV_THROW 1727ev_set_allocator (void *(*cb)(void *ptr, long size) EV_THROW) EV_THROW
1164{ 1728{
1165 alloc = cb; 1729 alloc = cb;
1166} 1730}
1167 1731
1168inline_speed void * 1732inline_speed void *
1817static void noinline ecb_cold 2381static void noinline ecb_cold
1818evpipe_init (EV_P) 2382evpipe_init (EV_P)
1819{ 2383{
1820 if (!ev_is_active (&pipe_w)) 2384 if (!ev_is_active (&pipe_w))
1821 { 2385 {
2386 int fds [2];
2387
1822# if EV_USE_EVENTFD 2388# if EV_USE_EVENTFD
2389 fds [0] = -1;
1823 evfd = eventfd (0, EFD_NONBLOCK | EFD_CLOEXEC); 2390 fds [1] = eventfd (0, EFD_NONBLOCK | EFD_CLOEXEC);
1824 if (evfd < 0 && errno == EINVAL) 2391 if (fds [1] < 0 && errno == EINVAL)
1825 evfd = eventfd (0, 0); 2392 fds [1] = eventfd (0, 0);
1826 2393
1827 if (evfd >= 0) 2394 if (fds [1] < 0)
1828 {
1829 evpipe [0] = -1;
1830 fd_intern (evfd); /* doing it twice doesn't hurt */
1831 ev_io_set (&pipe_w, evfd, EV_READ);
1832 }
1833 else
1834# endif 2395# endif
1835 { 2396 {
1836 while (pipe (evpipe)) 2397 while (pipe (fds))
1837 ev_syserr ("(libev) error creating signal/async pipe"); 2398 ev_syserr ("(libev) error creating signal/async pipe");
1838 2399
1839 fd_intern (evpipe [0]); 2400 fd_intern (fds [0]);
1840 fd_intern (evpipe [1]);
1841 ev_io_set (&pipe_w, evpipe [0], EV_READ);
1842 } 2401 }
1843 2402
2403 evpipe [0] = fds [0];
2404
2405 if (evpipe [1] < 0)
2406 evpipe [1] = fds [1]; /* first call, set write fd */
2407 else
2408 {
2409 /* on subsequent calls, do not change evpipe [1] */
2410 /* so that evpipe_write can always rely on its value. */
2411 /* this branch does not do anything sensible on windows, */
2412 /* so must not be executed on windows */
2413
2414 dup2 (fds [1], evpipe [1]);
2415 close (fds [1]);
2416 }
2417
2418 fd_intern (evpipe [1]);
2419
2420 ev_io_set (&pipe_w, evpipe [0] < 0 ? evpipe [1] : evpipe [0], EV_READ);
1844 ev_io_start (EV_A_ &pipe_w); 2421 ev_io_start (EV_A_ &pipe_w);
1845 ev_unref (EV_A); /* watcher should not keep loop alive */ 2422 ev_unref (EV_A); /* watcher should not keep loop alive */
1846 } 2423 }
1847} 2424}
1848 2425
1853 2430
1854 if (expect_true (*flag)) 2431 if (expect_true (*flag))
1855 return; 2432 return;
1856 2433
1857 *flag = 1; 2434 *flag = 1;
1858
1859 ECB_MEMORY_FENCE_RELEASE; /* make sure flag is visible before the wakeup */ 2435 ECB_MEMORY_FENCE_RELEASE; /* make sure flag is visible before the wakeup */
1860 2436
1861 pipe_write_skipped = 1; 2437 pipe_write_skipped = 1;
1862 2438
1863 ECB_MEMORY_FENCE; /* make sure pipe_write_skipped is visible before we check pipe_write_wanted */ 2439 ECB_MEMORY_FENCE; /* make sure pipe_write_skipped is visible before we check pipe_write_wanted */
1864 2440
1865 if (pipe_write_wanted) 2441 if (pipe_write_wanted)
1866 { 2442 {
1867 int old_errno; 2443 int old_errno;
1868 2444
1869 pipe_write_skipped = 0; /* just an optimisation, no fence needed */ 2445 pipe_write_skipped = 0;
2446 ECB_MEMORY_FENCE_RELEASE;
1870 2447
1871 old_errno = errno; /* save errno because write will clobber it */ 2448 old_errno = errno; /* save errno because write will clobber it */
1872 2449
1873#if EV_USE_EVENTFD 2450#if EV_USE_EVENTFD
1874 if (evfd >= 0) 2451 if (evpipe [0] < 0)
1875 { 2452 {
1876 uint64_t counter = 1; 2453 uint64_t counter = 1;
1877 write (evfd, &counter, sizeof (uint64_t)); 2454 write (evpipe [1], &counter, sizeof (uint64_t));
1878 } 2455 }
1879 else 2456 else
1880#endif 2457#endif
1881 { 2458 {
1882#ifdef _WIN32 2459#ifdef _WIN32
1902 int i; 2479 int i;
1903 2480
1904 if (revents & EV_READ) 2481 if (revents & EV_READ)
1905 { 2482 {
1906#if EV_USE_EVENTFD 2483#if EV_USE_EVENTFD
1907 if (evfd >= 0) 2484 if (evpipe [0] < 0)
1908 { 2485 {
1909 uint64_t counter; 2486 uint64_t counter;
1910 read (evfd, &counter, sizeof (uint64_t)); 2487 read (evpipe [1], &counter, sizeof (uint64_t));
1911 } 2488 }
1912 else 2489 else
1913#endif 2490#endif
1914 { 2491 {
1915 char dummy[4]; 2492 char dummy[4];
1916#ifdef _WIN32 2493#ifdef _WIN32
1917 WSABUF buf; 2494 WSABUF buf;
1918 DWORD recvd; 2495 DWORD recvd;
2496 DWORD flags = 0;
1919 buf.buf = dummy; 2497 buf.buf = dummy;
1920 buf.len = sizeof (dummy); 2498 buf.len = sizeof (dummy);
1921 WSARecv (EV_FD_TO_WIN32_HANDLE (evpipe [0]), &buf, 1, &recvd, 0, 0, 0); 2499 WSARecv (EV_FD_TO_WIN32_HANDLE (evpipe [0]), &buf, 1, &recvd, &flags, 0, 0);
1922#else 2500#else
1923 read (evpipe [0], &dummy, sizeof (dummy)); 2501 read (evpipe [0], &dummy, sizeof (dummy));
1924#endif 2502#endif
1925 } 2503 }
1926 } 2504 }
1932#if EV_SIGNAL_ENABLE 2510#if EV_SIGNAL_ENABLE
1933 if (sig_pending) 2511 if (sig_pending)
1934 { 2512 {
1935 sig_pending = 0; 2513 sig_pending = 0;
1936 2514
1937 ECB_MEMORY_FENCE_RELEASE; 2515 ECB_MEMORY_FENCE;
1938 2516
1939 for (i = EV_NSIG - 1; i--; ) 2517 for (i = EV_NSIG - 1; i--; )
1940 if (expect_false (signals [i].pending)) 2518 if (expect_false (signals [i].pending))
1941 ev_feed_signal_event (EV_A_ i + 1); 2519 ev_feed_signal_event (EV_A_ i + 1);
1942 } 2520 }
1945#if EV_ASYNC_ENABLE 2523#if EV_ASYNC_ENABLE
1946 if (async_pending) 2524 if (async_pending)
1947 { 2525 {
1948 async_pending = 0; 2526 async_pending = 0;
1949 2527
1950 ECB_MEMORY_FENCE_RELEASE; 2528 ECB_MEMORY_FENCE;
1951 2529
1952 for (i = asynccnt; i--; ) 2530 for (i = asynccnt; i--; )
1953 if (asyncs [i]->sent) 2531 if (asyncs [i]->sent)
1954 { 2532 {
1955 asyncs [i]->sent = 0; 2533 asyncs [i]->sent = 0;
2534 ECB_MEMORY_FENCE_RELEASE;
1956 ev_feed_event (EV_A_ asyncs [i], EV_ASYNC); 2535 ev_feed_event (EV_A_ asyncs [i], EV_ASYNC);
1957 } 2536 }
1958 } 2537 }
1959#endif 2538#endif
1960} 2539}
1963 2542
1964void 2543void
1965ev_feed_signal (int signum) EV_THROW 2544ev_feed_signal (int signum) EV_THROW
1966{ 2545{
1967#if EV_MULTIPLICITY 2546#if EV_MULTIPLICITY
2547 EV_P;
2548 ECB_MEMORY_FENCE_ACQUIRE;
1968 EV_P = signals [signum - 1].loop; 2549 EV_A = signals [signum - 1].loop;
1969 2550
1970 if (!EV_A) 2551 if (!EV_A)
1971 return; 2552 return;
1972#endif 2553#endif
1973 2554
1974 if (!ev_active (&pipe_w))
1975 return;
1976
1977 signals [signum - 1].pending = 1; 2555 signals [signum - 1].pending = 1;
1978 evpipe_write (EV_A_ &sig_pending); 2556 evpipe_write (EV_A_ &sig_pending);
1979} 2557}
1980 2558
1981static void 2559static void
1991void noinline 2569void noinline
1992ev_feed_signal_event (EV_P_ int signum) EV_THROW 2570ev_feed_signal_event (EV_P_ int signum) EV_THROW
1993{ 2571{
1994 WL w; 2572 WL w;
1995 2573
1996 if (expect_false (signum <= 0 || signum > EV_NSIG)) 2574 if (expect_false (signum <= 0 || signum >= EV_NSIG))
1997 return; 2575 return;
1998 2576
1999 --signum; 2577 --signum;
2000 2578
2001#if EV_MULTIPLICITY 2579#if EV_MULTIPLICITY
2005 if (expect_false (signals [signum].loop != EV_A)) 2583 if (expect_false (signals [signum].loop != EV_A))
2006 return; 2584 return;
2007#endif 2585#endif
2008 2586
2009 signals [signum].pending = 0; 2587 signals [signum].pending = 0;
2588 ECB_MEMORY_FENCE_RELEASE;
2010 2589
2011 for (w = signals [signum].head; w; w = w->next) 2590 for (w = signals [signum].head; w; w = w->next)
2012 ev_feed_event (EV_A_ (W)w, EV_SIGNAL); 2591 ev_feed_event (EV_A_ (W)w, EV_SIGNAL);
2013} 2592}
2014 2593
2228{ 2807{
2229 return userdata; 2808 return userdata;
2230} 2809}
2231 2810
2232void 2811void
2233ev_set_invoke_pending_cb (EV_P_ void (*invoke_pending_cb)(EV_P)) EV_THROW 2812ev_set_invoke_pending_cb (EV_P_ ev_loop_callback invoke_pending_cb) EV_THROW
2234{ 2813{
2235 invoke_cb = invoke_pending_cb; 2814 invoke_cb = invoke_pending_cb;
2236} 2815}
2237 2816
2238void 2817void
2298#if EV_ASYNC_ENABLE 2877#if EV_ASYNC_ENABLE
2299 async_pending = 0; 2878 async_pending = 0;
2300#endif 2879#endif
2301 pipe_write_skipped = 0; 2880 pipe_write_skipped = 0;
2302 pipe_write_wanted = 0; 2881 pipe_write_wanted = 0;
2882 evpipe [0] = -1;
2883 evpipe [1] = -1;
2303#if EV_USE_INOTIFY 2884#if EV_USE_INOTIFY
2304 fs_fd = flags & EVFLAG_NOINOTIFY ? -1 : -2; 2885 fs_fd = flags & EVFLAG_NOINOTIFY ? -1 : -2;
2305#endif 2886#endif
2306#if EV_USE_SIGNALFD 2887#if EV_USE_SIGNALFD
2307 sigfd = flags & EVFLAG_SIGNALFD ? -2 : -1; 2888 sigfd = flags & EVFLAG_SIGNALFD ? -2 : -1;
2358 EV_INVOKE_PENDING; 2939 EV_INVOKE_PENDING;
2359 } 2940 }
2360#endif 2941#endif
2361 2942
2362#if EV_CHILD_ENABLE 2943#if EV_CHILD_ENABLE
2363 if (ev_is_active (&childev)) 2944 if (ev_is_default_loop (EV_A) && ev_is_active (&childev))
2364 { 2945 {
2365 ev_ref (EV_A); /* child watcher */ 2946 ev_ref (EV_A); /* child watcher */
2366 ev_signal_stop (EV_A_ &childev); 2947 ev_signal_stop (EV_A_ &childev);
2367 } 2948 }
2368#endif 2949#endif
2370 if (ev_is_active (&pipe_w)) 2951 if (ev_is_active (&pipe_w))
2371 { 2952 {
2372 /*ev_ref (EV_A);*/ 2953 /*ev_ref (EV_A);*/
2373 /*ev_io_stop (EV_A_ &pipe_w);*/ 2954 /*ev_io_stop (EV_A_ &pipe_w);*/
2374 2955
2375#if EV_USE_EVENTFD
2376 if (evfd >= 0)
2377 close (evfd);
2378#endif
2379
2380 if (evpipe [0] >= 0)
2381 {
2382 EV_WIN32_CLOSE_FD (evpipe [0]); 2956 if (evpipe [0] >= 0) EV_WIN32_CLOSE_FD (evpipe [0]);
2383 EV_WIN32_CLOSE_FD (evpipe [1]); 2957 if (evpipe [1] >= 0) EV_WIN32_CLOSE_FD (evpipe [1]);
2384 }
2385 } 2958 }
2386 2959
2387#if EV_USE_SIGNALFD 2960#if EV_USE_SIGNALFD
2388 if (ev_is_active (&sigfd_w)) 2961 if (ev_is_active (&sigfd_w))
2389 close (sigfd); 2962 close (sigfd);
2475#endif 3048#endif
2476#if EV_USE_INOTIFY 3049#if EV_USE_INOTIFY
2477 infy_fork (EV_A); 3050 infy_fork (EV_A);
2478#endif 3051#endif
2479 3052
3053#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE
2480 if (ev_is_active (&pipe_w)) 3054 if (ev_is_active (&pipe_w) && postfork != 2)
2481 { 3055 {
2482 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */ 3056 /* pipe_write_wanted must be false now, so modifying fd vars should be safe */
2483 3057
2484 ev_ref (EV_A); 3058 ev_ref (EV_A);
2485 ev_io_stop (EV_A_ &pipe_w); 3059 ev_io_stop (EV_A_ &pipe_w);
2486 3060
2487#if EV_USE_EVENTFD
2488 if (evfd >= 0)
2489 close (evfd);
2490#endif
2491
2492 if (evpipe [0] >= 0) 3061 if (evpipe [0] >= 0)
2493 {
2494 EV_WIN32_CLOSE_FD (evpipe [0]); 3062 EV_WIN32_CLOSE_FD (evpipe [0]);
2495 EV_WIN32_CLOSE_FD (evpipe [1]);
2496 }
2497 3063
2498#if EV_SIGNAL_ENABLE || EV_ASYNC_ENABLE
2499 evpipe_init (EV_A); 3064 evpipe_init (EV_A);
2500 /* now iterate over everything, in case we missed something */ 3065 /* iterate over everything, in case we missed something before */
2501 pipecb (EV_A_ &pipe_w, EV_READ); 3066 ev_feed_event (EV_A_ &pipe_w, EV_CUSTOM);
2502#endif
2503 } 3067 }
3068#endif
2504 3069
2505 postfork = 0; 3070 postfork = 0;
2506} 3071}
2507 3072
2508#if EV_MULTIPLICITY 3073#if EV_MULTIPLICITY
2563#if EV_FEATURE_API 3128#if EV_FEATURE_API
2564void ecb_cold 3129void ecb_cold
2565ev_verify (EV_P) EV_THROW 3130ev_verify (EV_P) EV_THROW
2566{ 3131{
2567#if EV_VERIFY 3132#if EV_VERIFY
2568 int i, j; 3133 int i;
2569 WL w, w2; 3134 WL w, w2;
2570 3135
2571 assert (activecnt >= -1); 3136 assert (activecnt >= -1);
2572 3137
2573 assert (fdchangemax >= fdchangecnt); 3138 assert (fdchangemax >= fdchangecnt);
2574 for (i = 0; i < fdchangecnt; ++i) 3139 for (i = 0; i < fdchangecnt; ++i)
2575 assert (("libev: negative fd in fdchanges", fdchanges [i] >= 0)); 3140 assert (("libev: negative fd in fdchanges", fdchanges [i] >= 0));
2576 3141
2577 assert (anfdmax >= 0); 3142 assert (anfdmax >= 0);
2578 for (i = j = 0; i < anfdmax; ++i) 3143 for (i = 0; i < anfdmax; ++i)
3144 {
3145 int j = 0;
3146
2579 for (w = w2 = anfds [i].head; w; w = w->next) 3147 for (w = w2 = anfds [i].head; w; w = w->next)
2580 { 3148 {
2581 verify_watcher (EV_A_ (W)w); 3149 verify_watcher (EV_A_ (W)w);
2582 3150
2583 if (j++ & 1) 3151 if (j++ & 1)
2584 { 3152 {
2585 assert (("libev: io watcher list contains a loop", w != w2)); 3153 assert (("libev: io watcher list contains a loop", w != w2));
2586 w2 = w2->next; 3154 w2 = w2->next;
2587 } 3155 }
2588 3156
2589 assert (("libev: inactive fd watcher on anfd list", ev_active (w) == 1)); 3157 assert (("libev: inactive fd watcher on anfd list", ev_active (w) == 1));
2590 assert (("libev: fd mismatch between watcher and anfd", ((ev_io *)w)->fd == i)); 3158 assert (("libev: fd mismatch between watcher and anfd", ((ev_io *)w)->fd == i));
2591 } 3159 }
3160 }
2592 3161
2593 assert (timermax >= timercnt); 3162 assert (timermax >= timercnt);
2594 verify_heap (EV_A_ timers, timercnt); 3163 verify_heap (EV_A_ timers, timercnt);
2595 3164
2596#if EV_PERIODIC_ENABLE 3165#if EV_PERIODIC_ENABLE
2677} 3246}
2678 3247
2679void 3248void
2680ev_loop_fork (EV_P) EV_THROW 3249ev_loop_fork (EV_P) EV_THROW
2681{ 3250{
2682 postfork = 1; /* must be in line with ev_default_fork */ 3251 postfork = 1;
2683} 3252}
2684 3253
2685/*****************************************************************************/ 3254/*****************************************************************************/
2686 3255
2687void 3256void
2703} 3272}
2704 3273
2705void noinline 3274void noinline
2706ev_invoke_pending (EV_P) 3275ev_invoke_pending (EV_P)
2707{ 3276{
2708 for (pendingpri = NUMPRI; pendingpri--; ) /* pendingpri is modified during the loop */ 3277 pendingpri = NUMPRI;
3278
3279 while (pendingpri) /* pendingpri possibly gets modified in the inner loop */
3280 {
3281 --pendingpri;
3282
2709 while (pendingcnt [pendingpri]) 3283 while (pendingcnt [pendingpri])
2710 { 3284 {
2711 ANPENDING *p = pendings [pendingpri] + --pendingcnt [pendingpri]; 3285 ANPENDING *p = pendings [pendingpri] + --pendingcnt [pendingpri];
2712 3286
2713 p->w->pending = 0; 3287 p->w->pending = 0;
2714 EV_CB_INVOKE (p->w, p->events); 3288 EV_CB_INVOKE (p->w, p->events);
2715 EV_FREQUENT_CHECK; 3289 EV_FREQUENT_CHECK;
2716 } 3290 }
3291 }
2717} 3292}
2718 3293
2719#if EV_IDLE_ENABLE 3294#if EV_IDLE_ENABLE
2720/* make idle watchers pending. this handles the "call-idle */ 3295/* make idle watchers pending. this handles the "call-idle */
2721/* only when higher priorities are idle" logic */ 3296/* only when higher priorities are idle" logic */
2811{ 3386{
2812 EV_FREQUENT_CHECK; 3387 EV_FREQUENT_CHECK;
2813 3388
2814 while (periodiccnt && ANHE_at (periodics [HEAP0]) < ev_rt_now) 3389 while (periodiccnt && ANHE_at (periodics [HEAP0]) < ev_rt_now)
2815 { 3390 {
2816 int feed_count = 0;
2817
2818 do 3391 do
2819 { 3392 {
2820 ev_periodic *w = (ev_periodic *)ANHE_w (periodics [HEAP0]); 3393 ev_periodic *w = (ev_periodic *)ANHE_w (periodics [HEAP0]);
2821 3394
2822 /*assert (("libev: inactive timer on periodic heap detected", ev_is_active (w)));*/ 3395 /*assert (("libev: inactive timer on periodic heap detected", ev_is_active (w)));*/
3081 backend_poll (EV_A_ waittime); 3654 backend_poll (EV_A_ waittime);
3082 assert ((loop_done = EVBREAK_CANCEL, 1)); /* assert for side effect */ 3655 assert ((loop_done = EVBREAK_CANCEL, 1)); /* assert for side effect */
3083 3656
3084 pipe_write_wanted = 0; /* just an optimisation, no fence needed */ 3657 pipe_write_wanted = 0; /* just an optimisation, no fence needed */
3085 3658
3659 ECB_MEMORY_FENCE_ACQUIRE;
3086 if (pipe_write_skipped) 3660 if (pipe_write_skipped)
3087 { 3661 {
3088 assert (("libev: pipe_w not active, but pipe not written", ev_is_active (&pipe_w))); 3662 assert (("libev: pipe_w not active, but pipe not written", ev_is_active (&pipe_w)));
3089 ev_feed_event (EV_A_ &pipe_w, EV_CUSTOM); 3663 ev_feed_event (EV_A_ &pipe_w, EV_CUSTOM);
3090 } 3664 }
3468#if EV_MULTIPLICITY 4042#if EV_MULTIPLICITY
3469 assert (("libev: a signal must not be attached to two different loops", 4043 assert (("libev: a signal must not be attached to two different loops",
3470 !signals [w->signum - 1].loop || signals [w->signum - 1].loop == loop)); 4044 !signals [w->signum - 1].loop || signals [w->signum - 1].loop == loop));
3471 4045
3472 signals [w->signum - 1].loop = EV_A; 4046 signals [w->signum - 1].loop = EV_A;
4047 ECB_MEMORY_FENCE_RELEASE;
3473#endif 4048#endif
3474 4049
3475 EV_FREQUENT_CHECK; 4050 EV_FREQUENT_CHECK;
3476 4051
3477#if EV_USE_SIGNALFD 4052#if EV_USE_SIGNALFD
3632# define EV_INOTIFY_BUFSIZE (sizeof (struct inotify_event) * 2 + NAME_MAX) 4207# define EV_INOTIFY_BUFSIZE (sizeof (struct inotify_event) * 2 + NAME_MAX)
3633 4208
3634static void noinline 4209static void noinline
3635infy_add (EV_P_ ev_stat *w) 4210infy_add (EV_P_ ev_stat *w)
3636{ 4211{
3637 w->wd = inotify_add_watch (fs_fd, w->path, IN_ATTRIB | IN_DELETE_SELF | IN_MOVE_SELF | IN_MODIFY | IN_DONT_FOLLOW | IN_MASK_ADD); 4212 w->wd = inotify_add_watch (fs_fd, w->path,
4213 IN_ATTRIB | IN_DELETE_SELF | IN_MOVE_SELF | IN_MODIFY
4214 | IN_CREATE | IN_DELETE | IN_MOVED_FROM | IN_MOVED_TO
4215 | IN_DONT_FOLLOW | IN_MASK_ADD);
3638 4216
3639 if (w->wd >= 0) 4217 if (w->wd >= 0)
3640 { 4218 {
3641 struct statfs sfs; 4219 struct statfs sfs;
3642 4220
3646 4224
3647 if (!fs_2625) 4225 if (!fs_2625)
3648 w->timer.repeat = w->interval ? w->interval : DEF_STAT_INTERVAL; 4226 w->timer.repeat = w->interval ? w->interval : DEF_STAT_INTERVAL;
3649 else if (!statfs (w->path, &sfs) 4227 else if (!statfs (w->path, &sfs)
3650 && (sfs.f_type == 0x1373 /* devfs */ 4228 && (sfs.f_type == 0x1373 /* devfs */
4229 || sfs.f_type == 0x4006 /* fat */
4230 || sfs.f_type == 0x4d44 /* msdos */
3651 || sfs.f_type == 0xEF53 /* ext2/3 */ 4231 || sfs.f_type == 0xEF53 /* ext2/3 */
4232 || sfs.f_type == 0x72b6 /* jffs2 */
4233 || sfs.f_type == 0x858458f6 /* ramfs */
4234 || sfs.f_type == 0x5346544e /* ntfs */
3652 || sfs.f_type == 0x3153464a /* jfs */ 4235 || sfs.f_type == 0x3153464a /* jfs */
4236 || sfs.f_type == 0x9123683e /* btrfs */
3653 || sfs.f_type == 0x52654973 /* reiser3 */ 4237 || sfs.f_type == 0x52654973 /* reiser3 */
3654 || sfs.f_type == 0x01021994 /* tempfs */ 4238 || sfs.f_type == 0x01021994 /* tmpfs */
3655 || sfs.f_type == 0x58465342 /* xfs */)) 4239 || sfs.f_type == 0x58465342 /* xfs */))
3656 w->timer.repeat = 0.; /* filesystem is local, kernel new enough */ 4240 w->timer.repeat = 0.; /* filesystem is local, kernel new enough */
3657 else 4241 else
3658 w->timer.repeat = w->interval ? w->interval : NFS_STAT_INTERVAL; /* remote, use reduced frequency */ 4242 w->timer.repeat = w->interval ? w->interval : NFS_STAT_INTERVAL; /* remote, use reduced frequency */
3659 } 4243 }

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines