/** Copyright (C) powturbo 2013-2017 GPL v2 License This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. - homepage : https://sites.google.com/site/powturbo/ - github : https://github.com/powturbo - twitter : https://twitter.com/powturbo - email : powturbo [_AT_] gmail [_DOT_] com **/ // bitpack.h - "Integer Compression" Binary Packing header file #ifndef BITPACK_H_ #define BITPACK_H_ #ifdef __cplusplus extern "C" { #endif #include //******************** Bit Packing High Level API - n unlimited *************************************************** size_t bitnpack8( uint8_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitnpack16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitnpack32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitnpack64( uint64_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitndpack8( uint8_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitndpack16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitndpack32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitndpack64( uint64_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitnd1pack8( uint8_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitnd1pack16( uint16_t *__restrict in, 
size_t n, unsigned char *__restrict out); size_t bitnd1pack32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitnd1pack64( uint64_t *__restrict in, size_t n, unsigned char *__restrict out); size_t bitnunpack8( unsigned char *__restrict in, size_t n, uint8_t *__restrict out); size_t bitnunpack16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out); size_t bitnunpack32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out); size_t bitnunpack64( unsigned char *__restrict in, size_t n, uint64_t *__restrict out); size_t bitndunpack8( unsigned char *__restrict in, size_t n, uint8_t *__restrict out); size_t bitndunpack16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out); size_t bitndunpack32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out); size_t bitndunpack64( unsigned char *__restrict in, size_t n, uint64_t *__restrict out); size_t bitnd1unpack8( unsigned char *__restrict in, size_t n, uint8_t *__restrict out); size_t bitnd1unpack16(unsigned char *__restrict in, size_t n, uint16_t *__restrict out); size_t bitnd1unpack32(unsigned char *__restrict in, size_t n, uint32_t *__restrict out); size_t bitnd1unpack64(unsigned char *__restrict in, size_t n, uint64_t *__restrict out); //******** Bit Packing Low level API **************************************************************** // bipackNN: Pack array with n unsigned (NN bits in[n]) values to the buffer out using nbits per value. 
// Return value = end of compressed buffer out
//   in    : array of n unsigned NN-bit values to pack
//   out   : buffer receiving the packed data
//   b     : number of bits used per packed value
//   start : extra NN-bit argument of the delta / FOR / zigzag variants
//           NOTE(review): presumably the reference value preceding in[0] - confirm against the implementation.
// NOTE(review): out is declared "const unsigned char *" here although it is described as the destination
// buffer (the SIMD variants of this API take a non-const out). The qualifier is kept so that these
// declarations stay identical to what callers and definitions already use.
unsigned char *bitpack8(    uint8_t  *__restrict in, unsigned n, const unsigned char *__restrict out, unsigned b);
unsigned char *bitpack16(   uint16_t *__restrict in, unsigned n, const unsigned char *__restrict out, unsigned b);
unsigned char *bitpack32(   uint32_t *__restrict in, unsigned n, const unsigned char *__restrict out, unsigned b);
unsigned char *bitpack64(   uint64_t *__restrict in, unsigned n, const unsigned char *__restrict out, unsigned b);

// delta bit packing
unsigned char *bitdpack8(   uint8_t  *__restrict in, unsigned n, const unsigned char *__restrict out, uint8_t  start, unsigned b);
unsigned char *bitdpack16(  uint16_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint16_t start, unsigned b);
unsigned char *bitdpack32(  uint32_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint32_t start, unsigned b);
unsigned char *bitdpack64(  uint64_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint64_t start, unsigned b);

unsigned char *bitd1pack8(  uint8_t  *__restrict in, unsigned n, const unsigned char *__restrict out, uint8_t  start, unsigned b);
unsigned char *bitd1pack16( uint16_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint16_t start, unsigned b);
unsigned char *bitd1pack32( uint32_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint32_t start, unsigned b);
unsigned char *bitd1pack64( uint64_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint64_t start, unsigned b);

// FOR bit packing : sorted integer array
unsigned char *bitfpack8(   uint8_t  *__restrict in, unsigned n, const unsigned char *__restrict out, uint8_t  start, unsigned b);
unsigned char *bitfpack16(  uint16_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint16_t start, unsigned b);
unsigned char *bitfpack32(  uint32_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint32_t start, unsigned b);
unsigned char *bitfpack64(  uint64_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint64_t start, unsigned b);

unsigned char *bitf1pack8(  uint8_t  *__restrict in, unsigned n, const unsigned char *__restrict out, uint8_t  start, unsigned b);
unsigned char *bitf1pack16( uint16_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint16_t start, unsigned b);
unsigned char *bitf1pack32( uint32_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint32_t start, unsigned b);
unsigned char *bitf1pack64( uint64_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint64_t start, unsigned b);

// zigzag : unsorted integer array
unsigned char *bitzpack8(   uint8_t  *__restrict in, unsigned n, const unsigned char *__restrict out, uint8_t  start, unsigned b);
unsigned char *bitzpack16(  uint16_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint16_t start, unsigned b);
unsigned char *bitzpack32(  uint32_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint32_t start, unsigned b);
unsigned char *bitzpack64(  uint64_t *__restrict in, unsigned n, const unsigned char *__restrict out, uint64_t start, unsigned b);

//-------------------------------------- SIMD ------------------------------------------------------------------------------------------

// Pack array with 128 unsigned (32 bits in[n]) values to the buffer out using nbits per value.
// Return value = end of compressed buffer out
//   in    : array of 32-bit unsigned values to pack
//   out   : buffer receiving the packed data
//   b     : number of bits used per packed value
//   start : extra argument of the delta (d, d1) and zigzag (z) variants
//           NOTE(review): presumably the reference value preceding in[0] - confirm against the implementation.
// The 128v32 / 256v32 suffixes name two families with otherwise identical signatures.
unsigned char *bitpack128v32(  unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned b);
unsigned char *bitdpack128v32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start, unsigned b);
unsigned char *bitd1pack128v32(unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start, unsigned b);
unsigned char *bitzpack128v32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start, unsigned b);

unsigned char *bitpack256v32(  unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned b);
unsigned char *bitdpack256v32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start, unsigned b);
unsigned char *bitd1pack256v32(unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start, unsigned b);
unsigned char *bitzpack256v32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start, unsigned b);

//********************************** Bit Packing : Unpack ****************************************************************

// ---------------- Unpack a b-bits packed integer array -------------------------------------------------------------------------------
// unpack a bitpacked integer array.
Return value = end of packed buffer in unsigned char *bitunpack8( const unsigned char *__restrict in, unsigned n, uint8_t *__restrict out, unsigned b); unsigned char *bitunpack16( const unsigned char *__restrict in, unsigned n, uint16_t *__restrict out, unsigned b); unsigned char *bitunpack32( const unsigned char *__restrict in, unsigned n, uint32_t *__restrict out, unsigned b); unsigned char *bitunpack64( const unsigned char *__restrict in, unsigned n, uint64_t *__restrict out, unsigned b); // ---------------- Direct Access to a single packed integer array entry -------------------------------------------------------------- #ifndef NTURBOPFOR_DAC #ifdef __AVX2__ #include #define bzhi64(_u_, _b_) _bzhi_u64(_u_, _b_) #define bzhi32(_u_, _b_) _bzhi_u32(_u_, _b_) #else #define bzhi64(_u_, _b_) ((_u_) & ((1ull<<(_b_))-1)) #define bzhi32(_u_, _b_) ((_u_) & ((1u <<(_b_))-1)) #endif #include "conf.h" // Get a single 32 bits value with index "idx" (or bit index b*idx) from packed integer array static ALWAYS_INLINE unsigned bitgetx32(const unsigned char *__restrict in, unsigned idx, unsigned b) { unsigned bidx = b*idx; return bzhi64( ctou64((unsigned *)in+(bidx>>5)) >> (bidx&0x1f), b ); } static ALWAYS_INLINE unsigned _bitgetx32(const unsigned char *__restrict in, unsigned bidx, unsigned b) { return bzhi64( ctou64((unsigned *)in+(bidx>>5)) >> (bidx&0x1f), b ); } // like bitgetx32 but for 16 bits integer array static ALWAYS_INLINE unsigned bitgetx8( const unsigned char *__restrict in, unsigned idx, unsigned b) { unsigned bidx = b*idx; return bzhi32( ctou16((uint16_t *)in+(bidx>>4)) >> (bidx& 0xf), b ); } static ALWAYS_INLINE unsigned _bitgetx8( const unsigned char *__restrict in, unsigned bidx, unsigned b) { return bzhi32( ctou16((uint16_t *)in+(bidx>>4)) >> (bidx& 0xf), b ); } static ALWAYS_INLINE unsigned bitgetx16(const unsigned char *__restrict in, unsigned idx, unsigned b) { unsigned bidx = b*idx; return bzhi32( ctou32((uint32_t *)in+(bidx>>4)) >> (bidx& 0xf), b ); } 
// Get a single value of b bits (b <= 16) located at bit index bidx of the packed array in.
// bidx>>4 is an index in 16-bit units, so the base pointer must be a uint16_t pointer; the 32-bit load
// covers any value of up to 16 bits starting at bit offset 0..15.
static ALWAYS_INLINE unsigned _bitgetx16(const unsigned char *__restrict in, unsigned bidx, unsigned b) {
  return bzhi32( ctou32((uint16_t *)in+(bidx>>4)) >> (bidx& 0xf), b );
}

// NOTE(review): the line below is truncated/garbled in the reviewed text and is kept verbatim.
// Set a single value with index "idx" static ALWAYS_INLINE void bitsetx16(const unsigned char *__restrict in, unsigned idx, unsigned v, unsigned b) { unsigned bidx = b*idx; unsigned *p = (unsigned *) in+(bidx>>4) ; *p = ( *p & ~(((1u <>5)); *p = ( *p & ~(((1ull<