/** Copyright (C) powturbo 2013-2018 GPL v2 License This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. - homepage : https://sites.google.com/site/powturbo/ - github : https://github.com/powturbo - twitter : https://twitter.com/powturbo - email : powturbo [_AT_] gmail [_DOT_] com **/ // conf.h - config & common #ifndef CONF_H #define CONF_H //------------------------- Compiler ------------------------------------------ #if defined(__GNUC__) #include #define ALIGNED(t,v,n) t v __attribute__ ((aligned (n))) #define ALWAYS_INLINE inline __attribute__((always_inline)) #define NOINLINE __attribute__((noinline)) #define _PACKED __attribute__ ((packed)) #define likely(x) __builtin_expect((x),1) #define unlikely(x) __builtin_expect((x),0) #define popcnt32(_x_) __builtin_popcount(_x_) #define popcnt64(_x_) __builtin_popcountll(_x_) #if defined(__i386__) || defined(__x86_64__) //__bsr32 1:0,2:1,3:1,4:2,5:2,6:2,7:2,8:3,9:3,10:3,11:3,12:3,13:3,14:3,15:3,16:4,17:4,18:4,19:4,20:4,21:4,22:4,23:4,24:4,25:4,26:4,27:4,28:4,29:4,30:4,31:4,32:5 //bsr32: 0:0,1:1,2:2,3:2,4:3,5:3,6:3,7:3,8:4,9:4,10:4,11:4,12:4,13:4,14:4,15:4,16:5,17:5,18:5,19:5,20:5,21:5,22:5,23:5,24:5,25:5,26:5,27:5,28:5,29:5,30:5,31:5,32:6, static inline int __bsr32( int x) { asm("bsr %1,%0" : "=r" (x) : "rm" (x) ); return x; } static inline int bsr32( int x) { int b = -1; asm("bsrl %1,%0" : "+r" (b) : "rm" (x) ); return b + 1; } static inline int bsr64(uint64_t x) { return x?64 - __builtin_clzll(x):0; } static inline unsigned rol32(unsigned x, int s) { asm ("roll %%cl,%0" :"=r" (x) :"0" (x),"c" (s)); return x; } static inline unsigned ror32(unsigned x, int s) { asm ("rorl %%cl,%0" :"=r" (x) :"0" (x),"c" (s)); return x; } static inline uint64_t rol64(uint64_t x, int s) { asm ("rolq %%cl,%0" :"=r" (x) :"0" (x),"c" (s)); return x; } static inline uint64_t ror64(uint64_t x, int s) { asm ("rorq %%cl,%0" :"=r" (x) :"0" (x),"c" (s)); return x; } #else static inline int __bsr32(unsigned x ) { return 31 - __builtin_clz( x); } static inline int bsr32(int x ) { return x?32 - __builtin_clz( x):0; } static inline int bsr64(uint64_t x) { return x?64 - __builtin_clzll(x):0; } static inline unsigned rol32(unsigned x, int s) { return x << s | x >> (32 - s); } static inline unsigned ror32(unsigned x, int s) { return x >> s | x << (32 - s); } static inline unsigned rol64(unsigned x, int s) { return x << s | x >> (64 - s); } static inline unsigned ror64(unsigned x, int s) { return x >> s | x << (64 - s); } #endif #define ctz64(_x_) __builtin_ctzll(_x_) #define ctz32(_x_) __builtin_ctz(_x_) #define clz64(_x_) __builtin_clzll(_x_) #define clz32(_x_) __builtin_clz(_x_) #if __GNUC__ > 4 || __GNUC__ == 4 && __GNUC_MINOR__ >= 8 #define bswap16(x) __builtin_bswap16(x) #else static inline unsigned short bswap16(unsigned short x) { return __builtin_bswap32(x << 16); } #endif #define bswap32(x) __builtin_bswap32(x) #define bswap64(x) __builtin_bswap64(x) #elif _MSC_VER //---------------------------------------------------- #include #include #if _MSC_VER < 1600 #include "vs/stdint.h" #define __builtin_prefetch(x,a) #define inline __inline #else #include #define __builtin_prefetch(x,a) _mm_prefetch(x, _MM_HINT_NTA) #endif #define ALIGNED(x) __declspec(align(x)) #define ALWAYS_INLINE __forceinline #define NOINLINE __declspec(noinline) #define THREADLOCAL __declspec(thread) #define likely(x) (x) #define unlikely(x) (x) static inline int __bsr32(unsigned x) { unsigned long z=0; _BitScanReverse(&z, x); return z; } static inline int bsr32( unsigned x) { unsigned long z; _BitScanReverse(&z, x); return x?z+1:0; } static inline int ctz32( unsigned x) { unsigned long z; _BitScanForward(&z, x); return x?z:32; } static inline int clz32( unsigned x) { unsigned long z; _BitScanReverse(&z, x); return x?31-z:32; } #ifdef _WIN64 #pragma intrinsic(_BitScanReverse) static inline int bsr64(uint64_t x) { unsigned long z=0; _BitScanReverse64(&z, x); return x?z+1:0; } static inline int ctz64(uint64_t x) { unsigned long z; _BitScanForward64(&z, x); return x?z:64; } static inline int clz64(uint64_t x) { unsigned long z; _BitScanReverse64(&z, x); return x?63-z:64; } #endif #define rol32(x,s) _lrotl(x, s) #define ror32(x,s) _lrotr(x, s) #define bswap16(x) _byteswap_ushort(x) #define bswap32(x) _byteswap_ulong(x) #define bswap64(x) _byteswap_uint64(x) #define popcnt32(x) __popcnt(x) #define popcnt64(x) __popcnt64(x) #define sleep(x) Sleep(x/1000) #define fseeko _fseeki64 #define ftello _ftelli64 #define strcasecmp _stricmp #define strncasecmp _strnicmp #define strtoull _strtoui64 static inline double round(double num) { return (num > 0.0) ? floor(num + 0.5) : ceil(num - 0.5); } #endif #define bsr8(_x_) bsr32(_x_) #define bsr16(_x_) bsr32(_x_) #define ctz8(_x_) ctz32(_x_) #define ctz16(_x_) ctz32(_x_) #define clz8(_x_) (clz32(_x_)-8) #define clz16(_x_) (clz32(_x_)-16) //--------------- Unaligned memory access ------------------------------------- /*# || defined(i386) || defined(_X86_) || defined(__THW_INTEL)*/ #if defined(__i386__) || defined(__x86_64__) || \ defined(_M_IX86) || defined(_M_AMD64) || _MSC_VER ||\ defined(__powerpc__) ||\ defined(__ARM_FEATURE_UNALIGNED) || defined(__aarch64__) || defined(__arm__) ||\ defined(__ARM_ARCH_4__) || defined(__ARM_ARCH_4T__) || \ defined(__ARM_ARCH_5__) || defined(__ARM_ARCH_5T__) || defined(__ARM_ARCH_5TE__) || defined(__ARM_ARCH_5TEJ__) || \ defined(__ARM_ARCH_6__) || defined(__ARM_ARCH_6J__) || defined(__ARM_ARCH_6K__) || defined(__ARM_ARCH_6T2__) || defined(__ARM_ARCH_6Z__) || defined(__ARM_ARCH_6ZK__) #define ctou16(_cp_) (*(unsigned short *)(_cp_)) #define ctou32(_cp_) (*(unsigned *)(_cp_)) #if defined(__i386__) || defined(__x86_64__) || defined(__powerpc__) || defined(_MSC_VER) #define ctou64(_cp_) (*(uint64_t *)(_cp_)) #elif defined(__ARM_FEATURE_UNALIGNED) struct _PACKED longu { uint64_t l; }; #define ctou64(_cp_) ((struct longu *)(_cp_))->l #endif #elif defined(__ARM_ARCH_7__) || defined(__ARM_ARCH_7A__) || defined(__ARM_ARCH_7M__) || defined(__ARM_ARCH_7R__) || defined(__ARM_ARCH_7S__) struct _PACKED shortu { unsigned short s; }; struct _PACKED unsignedu { unsigned u; }; struct _PACKED longu { uint64_t l; }; #define ctou16(_cp_) ((struct shortu *)(_cp_))->s #define ctou32(_cp_) ((struct unsignedu *)(_cp_))->u #define ctou64(_cp_) ((struct longu *)(_cp_))->l #else #error "unknown cpu" #endif #ifdef ctou16 //#define utoc16(_x_,_cp_) ctou16(_cp_) = _x_ #else static inline unsigned short ctou16(void *cp) { unsigned short x; memcpy((void *)&x, cp, (unsigned int)sizeof(x)); return x; } //static inline void utoc16(unsigned short x, void *cp ) { memcpy(cp, &x, sizeof(x)); } #endif #ifdef ctou32 //#define utoc32(_x_,_cp_) ctou32(_cp_) = _x_ #else static inline unsigned ctou32(void *cp) { unsigned x; memcpy(void *)&x, cp, (unsigned int)sizeof(x)); return x; } //static inline void utoc32(unsigned x, void *cp ) { memcpy(cp, &x, sizeof(x)); } #endif #ifdef ctou64 //#define utoc64(_x_,_cp_) ctou64(_cp_) = _x_ #else static inline uint64_t ctou64(void *cp) { uint64_t x; memcpy((void *)&x, cp, (unsigned int)sizeof(x)); return x; } //static inline void utoc64(uint64_t x, void *cp ) { memcpy(cp, &x, sizeof(x)); } #endif #define ctou24(_cp_) (ctou32(_cp_) & 0xffffff) #define ctou48(_cp_) (ctou64(_cp_) & 0xffffffffffffull) #define ctou8(_cp_) (*_cp_) //--------------------- wordsize ---------------------------------------------- #if defined(__64BIT__) || defined(_LP64) || defined(__LP64__) || defined(_WIN64) ||\ defined(__x86_64__) || defined(_M_X64) ||\ defined(__ia64) || defined(_M_IA64) ||\ defined(__aarch64__) ||\ defined(__mips64) ||\ defined(__powerpc64__) || defined(__ppc64__) || defined(__PPC64__) ||\ defined(__s390x__) #define __WORDSIZE 64 #else #define __WORDSIZE 32 #endif #endif //---------------------misc --------------------------------------------------- #define SIZE_ROUNDUP(_n_, _a_) (((size_t)(_n_) + (size_t)((_a_) - 1)) & ~(size_t)((_a_) - 1)) #define ALIGN_DOWN(__ptr, __a) ((void *)((uintptr_t)(__ptr) & ~(uintptr_t)((__a) - 1))) #define TEMPLATE2_(_x_, _y_) _x_##_y_ #define TEMPLATE2(_x_, _y_) TEMPLATE2_(_x_,_y_) #define TEMPLATE3_(_x_,_y_,_z_) _x_##_y_##_z_ #define TEMPLATE3(_x_,_y_,_z_) TEMPLATE3_(_x_, _y_, _z_) //--- NDEBUG ------- #include #ifdef _MSC_VER #ifdef NDEBUG #define AS(expr, fmt, __VA_ARGS__) #define AC(expr, fmt, __VA_ARGS__) if(!(expr)) { fprintf(stderr, fmt, __VA_ARGS__ ); fflush(stderr); abort(); } #define die(fmt, __VA_ARGS__) do { fprintf(stderr, fmt, __VA_ARGS__ ); fflush(stderr); exit(-1); } while(0) #else #define AS(expr, fmt, __VA_ARGS__) if(!(expr)) { fflush(stdout);fprintf(stderr, "%s:%s:%d:", __FILE__, __FUNCTION__, __LINE__); fprintf(stderr, fmt, ,__VA_ARGS__ ); fflush(stderr); abort(); } #define AC(expr, fmt, __VA_ARGS__) if(!(expr)) { fflush(stdout);fprintf(stderr, "%s:%s:%d:", __FILE__, __FUNCTION__, __LINE__); fprintf(stderr, fmt, ,__VA_ARGS__ ); fflush(stderr); abort(); } #define die(fmt, __VA_ARGS__) do { fprintf(stderr, "%s:%s:%d:", __FILE__, __FUNCTION__, __LINE__); fprintf(stderr, fmt, __VA_ARGS__ ); fflush(stderr); exit(-1); } while(0) #endif #else #ifdef NDEBUG #define AS(expr, fmt,args...) #define AC(expr, fmt,args...) if(!(expr)) { fprintf(stderr, fmt, ## args ); fflush(stderr); abort(); } #define die(fmt,args...) do { fprintf(stderr, fmt, ## args ); fflush(stderr); exit(-1); } while(0) #else #define AS(expr, fmt,args...) if(!(expr)) { fflush(stdout);fprintf(stderr, "%s:%s:%d:", __FILE__, __FUNCTION__, __LINE__); fprintf(stderr, fmt, ## args ); fflush(stderr); abort(); } #define AC(expr, fmt,args...) if(!(expr)) { fflush(stdout);fprintf(stderr, "%s:%s:%d:", __FILE__, __FUNCTION__, __LINE__); fprintf(stderr, fmt, ## args ); fflush(stderr); abort(); } #define die(fmt,args...) do { fprintf(stderr, "%s:%s:%d:", __FILE__, __FUNCTION__, __LINE__); fprintf(stderr, fmt, ## args ); fflush(stderr); exit(-1); } while(0) #endif #endif