From 75b42a7eb78aa18427de64593576482faffe992b Mon Sep 17 00:00:00 2001 From: powturbo Date: Thu, 18 Jun 2015 17:39:01 +0200 Subject: [PATCH] BitUnpack: Direct Access/Update, FOR, Delta+FOR, SIMD --- bitunpack.h | 20 +++++++++++--------- 1 file changed, 11 insertions(+), 9 deletions(-) diff --git a/bitunpack.h b/bitunpack.h index 3117c68..be53d19 100644 --- a/bitunpack.h +++ b/bitunpack.h @@ -26,15 +26,17 @@ #ifdef __cplusplus extern "C" { #endif +#include #include "conf.h" -// ---------------- Unpack a previously bit packed (scalar bitpack32 or bipack16) integer array ----------------------------------------------------------------- +// ---------------- Unpack a bit packed integer array -------------------------------------------------------------------------------------- // unpack a bitpacked integer array. Return value = end of packed buffer in -unsigned char *bitunpack16(unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned b); unsigned char *bitunpack32(unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned b); +unsigned char *bitunpack16(unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned b); +unsigned char *bitunpack64(unsigned char *__restrict in, unsigned n, uint64_t *__restrict out, unsigned b); -// ---------------- Direct Access to a single bit packed (see bitpack.h) integer array entry -------------------------------------------------------------------- +// ---------------- Direct Access to a single packed integer array entry -------------------------------------------------------------------- #ifdef __AVX2__ #include #else @@ -42,11 +44,11 @@ unsigned char *bitunpack32(unsigned char *__restrict in, unsigned n, unsigned #define _bzhi_u32(__u, __b) ((__u) & ((1u <<__b)-1)) #endif -// Get a single 32 bits value with index "idx" (or bit index b*idx) from a previously bit packed (scalar bitpack32) integer array +// Get a single 32 bits value with index "idx" (or bit index b*idx) from packed integer array static ALWAYS_INLINE unsigned bitgetx32(unsigned char *__restrict in, unsigned b, unsigned idx) { unsigned bidx = b*idx; return _bzhi_u64( (*(unsigned long long *)((unsigned *)in+(bidx>>5))) >> (bidx&0x1f), b ); } static ALWAYS_INLINE unsigned _bitgetx32(unsigned char *__restrict in, unsigned b, unsigned bidx) { return _bzhi_u64( (*(unsigned long long *)((unsigned *)in+(bidx>>5))) >> (bidx&0x1f), b ); } -// like bitgetx32 but for 16 bits integer array (see scalar bitpack16) +// like bitgetx32 but for 16 bits integer array static ALWAYS_INLINE unsigned bitgetx16(unsigned char *__restrict in, unsigned b, unsigned idx) { unsigned bidx = b*idx; return _bzhi_u32( (*(unsigned *)((unsigned *)in+(bidx>>4))) >> (bidx& 0xf), b ); } static ALWAYS_INLINE unsigned _bitgetx16(unsigned char *__restrict in, unsigned b, unsigned bidx) { return _bzhi_u32( (*(unsigned *)((unsigned *)in+(bidx>>4))) >> (bidx& 0xf), b ); } @@ -54,7 +56,7 @@ static ALWAYS_INLINE unsigned _bitgetx16(unsigned char *__restrict in, unsigned static ALWAYS_INLINE void bitsetx32(unsigned char *__restrict in, unsigned b, unsigned idx, unsigned v) { unsigned bidx = b*idx; unsigned long long *p = (unsigned long long *)((unsigned *)in+(bidx>>5)); *p = ( *p & ~(((1ull<>4) ; *p = ( *p & ~(((1u <