250 lines
17 KiB
C
250 lines
17 KiB
C
//-- "Integer Compression" variable byte (scalar TurboVByte+ SIMD TurboByte) ---------------------------------------------------------------
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
//----------------------------- TurboVByte 'vb':Variable byte + SIMD TurboByte 'v8': array functions -----
|
|
size_t vbbound8( size_t n);
|
|
size_t vbbound16(size_t n);
|
|
size_t vbbound32(size_t n);
|
|
size_t vbbound64(size_t n);
|
|
|
|
// Encoding/Decoding: Return value = end of compressed/decompressed output/input buffer out/in
|
|
|
|
//----------------------- Encoding/Decoding unsorted array with n integer values --------------------------
|
|
unsigned char *vbenc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out); //TurboVByte
|
|
unsigned char *vbdec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out);
|
|
|
|
unsigned char *vbenc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out);
|
|
unsigned char *vbdec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out);
|
|
|
|
unsigned char *vbenc64( uint64_t *__restrict in, unsigned n, unsigned char *__restrict out);
|
|
unsigned char *vbdec64( unsigned char *__restrict in, unsigned n, uint64_t *__restrict out);
|
|
|
|
//-- Get value stored at index idx (idx:0...n-1)
|
|
unsigned short vbgetx16( unsigned char *__restrict in, unsigned idx);
|
|
unsigned vbgetx32( unsigned char *__restrict in, unsigned idx);
|
|
uint64_t vbgetx64( unsigned char *__restrict in, unsigned idx);
|
|
|
|
//-- Search and return index of next value equal to key or n when no key value found
|
|
// ex. unsigned idx;unsigned char *ip; for(idx=0,ip=in;;) { if((idx = vgeteq32(&ip, idx, 4321))>=n) break; printf("found at %u ", idx); }
|
|
unsigned vbgeteq16( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned short key);
|
|
unsigned vbgeteq32( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned key);
|
|
unsigned vbgeteq64( unsigned char **__restrict in, unsigned n, unsigned idx, uint64_t key);
|
|
|
|
//---------------------- Delta encoding/decoding sorted array ---------------------------------------------
|
|
//-- Increasing integer array. out[i] = out[i-1] + in[i]
|
|
unsigned char *vbdenc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *vbddec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
|
|
unsigned char *vbdenc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *vbddec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
unsigned char *vbdenc64( uint64_t *__restrict in, unsigned n, unsigned char *__restrict out, uint64_t start);
|
|
unsigned char *vbddec64( unsigned char *__restrict in, unsigned n, uint64_t *__restrict out, uint64_t start);
|
|
|
|
//-- Get value stored at index idx (idx:0...n-1)
|
|
unsigned short vbdgetx16( unsigned char *__restrict in, unsigned idx, unsigned short start);
|
|
unsigned vbdgetx32( unsigned char *__restrict in, unsigned idx, unsigned start);
|
|
uint64_t vbdgetx64( unsigned char *__restrict in, unsigned idx, uint64_t start);
|
|
|
|
//-- Search and return index of next value equal to key or n when no key value found
|
|
// ex. unsigned idx;unsigned char *ip; for(idx=0,ip=in;;) { if((idx = vgeteq32(&ip, idx, 4321))>=n) break; printf("found at %u ", idx); }
|
|
unsigned vbdgetgeq16( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned short *key, unsigned short start);
|
|
unsigned vbdgetgeq32( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned *key, unsigned start);
|
|
unsigned vbdgetgeq64( unsigned char **__restrict in, unsigned n, unsigned idx, uint64_t *key, uint64_t start);
|
|
|
|
//-- Strictly increasing (never remaining constant or decreasing) integer array. out[i] = out[i-1] + in[i] + 1
|
|
unsigned char *vbd1enc16(unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *vbd1enc32(unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *vbd1enc64(uint64_t *__restrict in, unsigned n, unsigned char *__restrict out, uint64_t start);
|
|
|
|
unsigned char *vbd1dec16(unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
unsigned char *vbd1dec32(unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
unsigned char *vbd1dec64(unsigned char *__restrict in, unsigned n, uint64_t *__restrict out, uint64_t start);
|
|
|
|
|
|
//-- Get value stored at index idx (idx:0...n-1)
|
|
unsigned short vbd1getx16( unsigned char *__restrict in, unsigned idx, unsigned short start);
|
|
unsigned vbd1getx32( unsigned char *__restrict in, unsigned idx, unsigned start);
|
|
uint64_t vbd1getx64( unsigned char *__restrict in, unsigned idx, uint64_t start);
|
|
|
|
//-- Search and return index of next value equal to key or n when no key value found
|
|
// ex. unsigned idx;unsigned char *ip; for(idx=0,ip=in;;) { if((idx = vgeteq32(&ip, idx, 4321))>=n) break; printf("found at %u ", idx); }
|
|
unsigned vbd1getgeq16( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned short *key, unsigned short start);
|
|
unsigned vbd1getgeq32( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned *key, unsigned start);
|
|
unsigned vbd1getgeq64( unsigned char **__restrict in, unsigned n, unsigned idx, uint64_t *key, uint64_t start);
|
|
|
|
//---------------------- Zigzag encoding/decoding for unsorted integer lists.
|
|
unsigned char *vbzenc8( unsigned char *__restrict in, unsigned n, unsigned char *__restrict out, unsigned char start);
|
|
unsigned char *vbzdec8( unsigned char *__restrict in, unsigned n, unsigned char *__restrict out, unsigned char start);
|
|
|
|
unsigned char *vbzenc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *vbzdec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
|
|
unsigned char *vbzenc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *vbzdec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
unsigned char *vbzenc64( uint64_t *__restrict in, unsigned n, unsigned char *__restrict out, uint64_t start);
|
|
unsigned char *vbzdec64( unsigned char *__restrict in, unsigned n, uint64_t *__restrict out, uint64_t start);
|
|
|
|
//---------------------- XOR encoding/decoding for unsorted integer lists.
|
|
unsigned char *vbxenc8( unsigned char *__restrict in, unsigned n, unsigned char *__restrict out, unsigned char start);
|
|
unsigned char *vbxdec8( unsigned char *__restrict in, unsigned n, unsigned char *__restrict out, unsigned char start);
|
|
|
|
unsigned char *vbxenc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *vbxdec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
|
|
unsigned char *vbxenc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *vbxdec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
unsigned char *vbxenc64( uint64_t *__restrict in, unsigned n, unsigned char *__restrict out, uint64_t start);
|
|
unsigned char *vbxdec64( unsigned char *__restrict in, unsigned n, uint64_t *__restrict out, uint64_t start);
|
|
|
|
//---------------------- Delta of delta encoding/decoding for unsorted integer lists.
|
|
unsigned char *vbddenc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *vbdddec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
|
|
unsigned char *vbddenc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *vbdddec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
unsigned char *vbddenc64( uint64_t *__restrict in, unsigned n, unsigned char *__restrict out, uint64_t start);
|
|
unsigned char *vbdddec64( unsigned char *__restrict in, unsigned n, uint64_t *__restrict out, uint64_t start);
|
|
|
|
//-- Get value stored at index idx (idx:0...n-1)
|
|
unsigned short vbzgetx16( unsigned char *__restrict in, unsigned idx, unsigned short start);
|
|
unsigned vbzgetx32( unsigned char *__restrict in, unsigned idx, unsigned start);
|
|
uint64_t vbzgetx64( unsigned char *__restrict in, unsigned idx, uint64_t start);
|
|
|
|
//-- Search and return index of next value equal to key or n when no key value found
|
|
// ex. unsigned idx;unsigned char *ip; for(idx=0,ip=in;;) { if((idx = vgeteq32(&ip, idx, 4321))>=n) break; printf("found at %u ", idx); }
|
|
/*unsigned vbzgeteq15( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned short key, unsigned start);
|
|
unsigned vbzgeteq16( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned short key, unsigned start);
|
|
unsigned vbzgeteq32( unsigned char **__restrict in, unsigned n, unsigned idx, unsigned key, unsigned start);
|
|
unsigned vbzgeteq64( unsigned char **__restrict in, unsigned n, unsigned idx, uint64_t key, unsigned start);*/
|
|
|
|
//-------------------------- TurboByte (SIMD Group varint) --------------------------------------------------------------
|
|
size_t v8bound16(size_t n);
|
|
size_t v8bound32(size_t n);
|
|
|
|
size_t v8len32(const uint32_t *in, size_t n);
|
|
size_t v8len16(const uint16_t *in, size_t n);
|
|
|
|
unsigned char *v8enc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out); //TurboByte
|
|
unsigned char *v8dec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out);
|
|
|
|
unsigned char *v8enc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out);
|
|
unsigned char *v8dec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out);
|
|
|
|
//------ delta ---------
|
|
unsigned char *v8denc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *v8ddec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
|
|
unsigned char *v8denc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *v8ddec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
//------ delta 1 -------
|
|
unsigned char *v8d1enc16(unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *v8d1dec16(unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
|
|
unsigned char *v8d1enc32(unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *v8d1dec32(unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
//------- zigzag -------
|
|
unsigned char *v8zenc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *v8zdec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
|
|
unsigned char *v8zenc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
unsigned char *v8zdec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
//------- xor ----------
|
|
unsigned char *v8xenc16( unsigned short *__restrict in, unsigned n, unsigned char *__restrict out, unsigned short start);
|
|
unsigned char *v8xenc32( unsigned *__restrict in, unsigned n, unsigned char *__restrict out, unsigned start);
|
|
|
|
unsigned char *v8xdec16( unsigned char *__restrict in, unsigned n, unsigned short *__restrict out, unsigned short start);
|
|
unsigned char *v8xdec32( unsigned char *__restrict in, unsigned n, unsigned *__restrict out, unsigned start);
|
|
|
|
//-------------------------- TurboByte Hybrid (SIMD Group varint) + Bitpacking -------------------------------------------
|
|
size_t v8nenc16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8ndec16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nenc32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8ndec32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8ndenc16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // delta
|
|
size_t v8nddec16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8ndenc32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nddec32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nd1enc16(uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // delta 1
|
|
size_t v8nd1dec16(unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nd1enc32(uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nd1dec32(unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nzenc16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // zigzag delta
|
|
size_t v8nzdec16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nzenc32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nzdec32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nxenc16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // xor
|
|
size_t v8nxdec16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nxenc32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nxdec32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
//------------- sse / neon ----------------------------------------------------------------------------
|
|
size_t v8nenc128v16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8ndec128v16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nenc128v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8ndec128v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8ndenc128v16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // delta
|
|
size_t v8nddec128v16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8ndenc128v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nddec128v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nd1enc128v16(uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // delta 1
|
|
size_t v8nd1dec128v16(unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nd1enc128v32(uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nd1dec128v32(unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nzenc128v16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // zigzag delta
|
|
size_t v8nzdec128v16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nzenc128v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nzdec128v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nxenc128v16( uint16_t *__restrict in, size_t n, unsigned char *__restrict out); // xor
|
|
size_t v8nxdec128v16( unsigned char *__restrict in, size_t n, uint16_t *__restrict out);
|
|
|
|
size_t v8nxenc128v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nxdec128v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
//------------- avx2 ------------------------------------------------------------------------------------
|
|
size_t v8nenc256v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8ndec256v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8ndenc256v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nddec256v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nd1enc256v32(uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nd1dec256v32(unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nzenc256v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nzdec256v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
size_t v8nxenc256v32( uint32_t *__restrict in, size_t n, unsigned char *__restrict out);
|
|
size_t v8nxdec256v32( unsigned char *__restrict in, size_t n, uint32_t *__restrict out);
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|