xref: /freebsd-src/sys/contrib/openzfs/module/zstd/lib/common/bitstream.h (revision c03c5b1c80914ec656fbee84539355d1fad68bf9)
1*c03c5b1cSMartin Matuska /* ******************************************************************
2*c03c5b1cSMartin Matuska  * bitstream
3*c03c5b1cSMartin Matuska  * Part of FSE library
4*c03c5b1cSMartin Matuska  * Copyright (c) 2013-2020, Yann Collet, Facebook, Inc.
5*c03c5b1cSMartin Matuska  *
6*c03c5b1cSMartin Matuska  * You can contact the author at :
7*c03c5b1cSMartin Matuska  * - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
8*c03c5b1cSMartin Matuska  *
9*c03c5b1cSMartin Matuska  * This source code is licensed under both the BSD-style license (found in the
10*c03c5b1cSMartin Matuska  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
11*c03c5b1cSMartin Matuska  * in the COPYING file in the root directory of this source tree).
12*c03c5b1cSMartin Matuska  * You may select, at your option, one of the above-listed licenses.
13*c03c5b1cSMartin Matuska ****************************************************************** */
14*c03c5b1cSMartin Matuska #ifndef BITSTREAM_H_MODULE
15*c03c5b1cSMartin Matuska #define BITSTREAM_H_MODULE
16*c03c5b1cSMartin Matuska 
17*c03c5b1cSMartin Matuska #if defined (__cplusplus)
18*c03c5b1cSMartin Matuska extern "C" {
19*c03c5b1cSMartin Matuska #endif
20*c03c5b1cSMartin Matuska 
21*c03c5b1cSMartin Matuska /*
22*c03c5b1cSMartin Matuska *  This API consists of small unitary functions, which must be inlined for best performance.
23*c03c5b1cSMartin Matuska *  Since link-time-optimization is not available for all compilers,
24*c03c5b1cSMartin Matuska *  these functions are defined into a .h to be included.
25*c03c5b1cSMartin Matuska */
26*c03c5b1cSMartin Matuska 
27*c03c5b1cSMartin Matuska /*-****************************************
28*c03c5b1cSMartin Matuska *  Dependencies
29*c03c5b1cSMartin Matuska ******************************************/
30*c03c5b1cSMartin Matuska #include "mem.h"            /* unaligned access routines */
31*c03c5b1cSMartin Matuska #include "compiler.h"       /* UNLIKELY() */
32*c03c5b1cSMartin Matuska #include "debug.h"          /* assert(), DEBUGLOG(), RAWLOG() */
33*c03c5b1cSMartin Matuska #include "error_private.h"  /* error codes and messages */
34*c03c5b1cSMartin Matuska 
35*c03c5b1cSMartin Matuska 
36*c03c5b1cSMartin Matuska /*=========================================
37*c03c5b1cSMartin Matuska *  Target specific
38*c03c5b1cSMartin Matuska =========================================*/
39*c03c5b1cSMartin Matuska #if defined(__BMI__) && defined(__GNUC__)
40*c03c5b1cSMartin Matuska #  include <immintrin.h>   /* support for bextr (experimental) */
41*c03c5b1cSMartin Matuska #elif defined(__ICCARM__)
42*c03c5b1cSMartin Matuska #  include <intrinsics.h>
43*c03c5b1cSMartin Matuska #endif
44*c03c5b1cSMartin Matuska 
45*c03c5b1cSMartin Matuska #define STREAM_ACCUMULATOR_MIN_32  25
46*c03c5b1cSMartin Matuska #define STREAM_ACCUMULATOR_MIN_64  57
47*c03c5b1cSMartin Matuska #define STREAM_ACCUMULATOR_MIN    ((U32)(MEM_32bits() ? STREAM_ACCUMULATOR_MIN_32 : STREAM_ACCUMULATOR_MIN_64))
48*c03c5b1cSMartin Matuska 
49*c03c5b1cSMartin Matuska 
50*c03c5b1cSMartin Matuska /*-******************************************
51*c03c5b1cSMartin Matuska *  bitStream encoding API (write forward)
52*c03c5b1cSMartin Matuska ********************************************/
53*c03c5b1cSMartin Matuska /* bitStream can mix input from multiple sources.
54*c03c5b1cSMartin Matuska  * A critical property of these streams is that they encode and decode in **reverse** direction.
55*c03c5b1cSMartin Matuska  * So the first bit sequence you add will be the last to be read, like a LIFO stack.
56*c03c5b1cSMartin Matuska  */
57*c03c5b1cSMartin Matuska typedef struct {
58*c03c5b1cSMartin Matuska     size_t bitContainer;
59*c03c5b1cSMartin Matuska     unsigned bitPos;
60*c03c5b1cSMartin Matuska     char*  startPtr;
61*c03c5b1cSMartin Matuska     char*  ptr;
62*c03c5b1cSMartin Matuska     char*  endPtr;
63*c03c5b1cSMartin Matuska } BIT_CStream_t;
64*c03c5b1cSMartin Matuska 
65*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC, void* dstBuffer, size_t dstCapacity);
66*c03c5b1cSMartin Matuska MEM_STATIC void   BIT_addBits(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
67*c03c5b1cSMartin Matuska MEM_STATIC void   BIT_flushBits(BIT_CStream_t* bitC);
68*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC);
69*c03c5b1cSMartin Matuska 
70*c03c5b1cSMartin Matuska /* Start with initCStream, providing the size of buffer to write into.
71*c03c5b1cSMartin Matuska *  bitStream will never write outside of this buffer.
72*c03c5b1cSMartin Matuska *  `dstCapacity` must be >= sizeof(bitD->bitContainer), otherwise @return will be an error code.
73*c03c5b1cSMartin Matuska *
74*c03c5b1cSMartin Matuska *  bits are first added to a local register.
75*c03c5b1cSMartin Matuska *  Local register is size_t, hence 64-bits on 64-bits systems, or 32-bits on 32-bits systems.
76*c03c5b1cSMartin Matuska *  Writing data into memory is an explicit operation, performed by the flushBits function.
77*c03c5b1cSMartin Matuska *  Hence keep track how many bits are potentially stored into local register to avoid register overflow.
78*c03c5b1cSMartin Matuska *  After a flushBits, a maximum of 7 bits might still be stored into local register.
79*c03c5b1cSMartin Matuska *
80*c03c5b1cSMartin Matuska *  Avoid storing elements of more than 24 bits if you want compatibility with 32-bits bitstream readers.
81*c03c5b1cSMartin Matuska *
82*c03c5b1cSMartin Matuska *  Last operation is to close the bitStream.
83*c03c5b1cSMartin Matuska *  The function returns the final size of CStream in bytes.
84*c03c5b1cSMartin Matuska *  If data couldn't fit into `dstBuffer`, it will return a 0 ( == not storable)
85*c03c5b1cSMartin Matuska */
86*c03c5b1cSMartin Matuska 
87*c03c5b1cSMartin Matuska 
88*c03c5b1cSMartin Matuska /*-********************************************
89*c03c5b1cSMartin Matuska *  bitStream decoding API (read backward)
90*c03c5b1cSMartin Matuska **********************************************/
91*c03c5b1cSMartin Matuska typedef struct {
92*c03c5b1cSMartin Matuska     size_t   bitContainer;
93*c03c5b1cSMartin Matuska     unsigned bitsConsumed;
94*c03c5b1cSMartin Matuska     const char* ptr;
95*c03c5b1cSMartin Matuska     const char* start;
96*c03c5b1cSMartin Matuska     const char* limitPtr;
97*c03c5b1cSMartin Matuska } BIT_DStream_t;
98*c03c5b1cSMartin Matuska 
99*c03c5b1cSMartin Matuska typedef enum { BIT_DStream_unfinished = 0,
100*c03c5b1cSMartin Matuska                BIT_DStream_endOfBuffer = 1,
101*c03c5b1cSMartin Matuska                BIT_DStream_completed = 2,
102*c03c5b1cSMartin Matuska                BIT_DStream_overflow = 3 } BIT_DStream_status;  /* result of BIT_reloadDStream() */
103*c03c5b1cSMartin Matuska                /* 1,2,4,8 would be better for bitmap combinations, but slows down performance a bit ... :( */
104*c03c5b1cSMartin Matuska 
105*c03c5b1cSMartin Matuska MEM_STATIC size_t   BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize);
106*c03c5b1cSMartin Matuska MEM_STATIC size_t   BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits);
107*c03c5b1cSMartin Matuska MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD);
108*c03c5b1cSMartin Matuska MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* bitD);
109*c03c5b1cSMartin Matuska 
110*c03c5b1cSMartin Matuska 
111*c03c5b1cSMartin Matuska /* Start by invoking BIT_initDStream().
112*c03c5b1cSMartin Matuska *  A chunk of the bitStream is then stored into a local register.
113*c03c5b1cSMartin Matuska *  Local register size is 64-bits on 64-bits systems, 32-bits on 32-bits systems (size_t).
114*c03c5b1cSMartin Matuska *  You can then retrieve bitFields stored into the local register, **in reverse order**.
115*c03c5b1cSMartin Matuska *  Local register is explicitly reloaded from memory by the BIT_reloadDStream() method.
116*c03c5b1cSMartin Matuska *  A reload guarantee a minimum of ((8*sizeof(bitD->bitContainer))-7) bits when its result is BIT_DStream_unfinished.
117*c03c5b1cSMartin Matuska *  Otherwise, it can be less than that, so proceed accordingly.
118*c03c5b1cSMartin Matuska *  Checking if DStream has reached its end can be performed with BIT_endOfDStream().
119*c03c5b1cSMartin Matuska */
120*c03c5b1cSMartin Matuska 
121*c03c5b1cSMartin Matuska 
122*c03c5b1cSMartin Matuska /*-****************************************
123*c03c5b1cSMartin Matuska *  unsafe API
124*c03c5b1cSMartin Matuska ******************************************/
125*c03c5b1cSMartin Matuska MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
126*c03c5b1cSMartin Matuska /* faster, but works only if value is "clean", meaning all high bits above nbBits are 0 */
127*c03c5b1cSMartin Matuska 
128*c03c5b1cSMartin Matuska MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC);
129*c03c5b1cSMartin Matuska /* unsafe version; does not check buffer overflow */
130*c03c5b1cSMartin Matuska 
131*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits);
132*c03c5b1cSMartin Matuska /* faster, but works only if nbBits >= 1 */
133*c03c5b1cSMartin Matuska 
134*c03c5b1cSMartin Matuska 
135*c03c5b1cSMartin Matuska 
136*c03c5b1cSMartin Matuska /*-**************************************************************
137*c03c5b1cSMartin Matuska *  Internal functions
138*c03c5b1cSMartin Matuska ****************************************************************/
BIT_highbit32(U32 val)139*c03c5b1cSMartin Matuska MEM_STATIC unsigned BIT_highbit32 (U32 val)
140*c03c5b1cSMartin Matuska {
141*c03c5b1cSMartin Matuska     assert(val != 0);
142*c03c5b1cSMartin Matuska     {
143*c03c5b1cSMartin Matuska #   if defined(_MSC_VER)   /* Visual */
144*c03c5b1cSMartin Matuska         unsigned long r=0;
145*c03c5b1cSMartin Matuska         return _BitScanReverse ( &r, val ) ? (unsigned)r : 0;
146*c03c5b1cSMartin Matuska #   elif defined(__GNUC__) && (__GNUC__ >= 3)   /* Use GCC Intrinsic */
147*c03c5b1cSMartin Matuska         return __builtin_clz (val) ^ 31;
148*c03c5b1cSMartin Matuska #   elif defined(__ICCARM__)    /* IAR Intrinsic */
149*c03c5b1cSMartin Matuska         return 31 - __CLZ(val);
150*c03c5b1cSMartin Matuska #   else   /* Software version */
151*c03c5b1cSMartin Matuska         static const unsigned DeBruijnClz[32] = { 0,  9,  1, 10, 13, 21,  2, 29,
152*c03c5b1cSMartin Matuska                                                  11, 14, 16, 18, 22, 25,  3, 30,
153*c03c5b1cSMartin Matuska                                                   8, 12, 20, 28, 15, 17, 24,  7,
154*c03c5b1cSMartin Matuska                                                  19, 27, 23,  6, 26,  5,  4, 31 };
155*c03c5b1cSMartin Matuska         U32 v = val;
156*c03c5b1cSMartin Matuska         v |= v >> 1;
157*c03c5b1cSMartin Matuska         v |= v >> 2;
158*c03c5b1cSMartin Matuska         v |= v >> 4;
159*c03c5b1cSMartin Matuska         v |= v >> 8;
160*c03c5b1cSMartin Matuska         v |= v >> 16;
161*c03c5b1cSMartin Matuska         return DeBruijnClz[ (U32) (v * 0x07C4ACDDU) >> 27];
162*c03c5b1cSMartin Matuska #   endif
163*c03c5b1cSMartin Matuska     }
164*c03c5b1cSMartin Matuska }
165*c03c5b1cSMartin Matuska 
166*c03c5b1cSMartin Matuska /*=====    Local Constants   =====*/
167*c03c5b1cSMartin Matuska static const unsigned BIT_mask[] = {
168*c03c5b1cSMartin Matuska     0,          1,         3,         7,         0xF,       0x1F,
169*c03c5b1cSMartin Matuska     0x3F,       0x7F,      0xFF,      0x1FF,     0x3FF,     0x7FF,
170*c03c5b1cSMartin Matuska     0xFFF,      0x1FFF,    0x3FFF,    0x7FFF,    0xFFFF,    0x1FFFF,
171*c03c5b1cSMartin Matuska     0x3FFFF,    0x7FFFF,   0xFFFFF,   0x1FFFFF,  0x3FFFFF,  0x7FFFFF,
172*c03c5b1cSMartin Matuska     0xFFFFFF,   0x1FFFFFF, 0x3FFFFFF, 0x7FFFFFF, 0xFFFFFFF, 0x1FFFFFFF,
173*c03c5b1cSMartin Matuska     0x3FFFFFFF, 0x7FFFFFFF}; /* up to 31 bits */
174*c03c5b1cSMartin Matuska #define BIT_MASK_SIZE (sizeof(BIT_mask) / sizeof(BIT_mask[0]))
175*c03c5b1cSMartin Matuska 
176*c03c5b1cSMartin Matuska /*-**************************************************************
177*c03c5b1cSMartin Matuska *  bitStream encoding
178*c03c5b1cSMartin Matuska ****************************************************************/
179*c03c5b1cSMartin Matuska /*! BIT_initCStream() :
180*c03c5b1cSMartin Matuska  *  `dstCapacity` must be > sizeof(size_t)
181*c03c5b1cSMartin Matuska  *  @return : 0 if success,
182*c03c5b1cSMartin Matuska  *            otherwise an error code (can be tested using ERR_isError()) */
BIT_initCStream(BIT_CStream_t * bitC,void * startPtr,size_t dstCapacity)183*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC,
184*c03c5b1cSMartin Matuska                                   void* startPtr, size_t dstCapacity)
185*c03c5b1cSMartin Matuska {
186*c03c5b1cSMartin Matuska     bitC->bitContainer = 0;
187*c03c5b1cSMartin Matuska     bitC->bitPos = 0;
188*c03c5b1cSMartin Matuska     bitC->startPtr = (char*)startPtr;
189*c03c5b1cSMartin Matuska     bitC->ptr = bitC->startPtr;
190*c03c5b1cSMartin Matuska     bitC->endPtr = bitC->startPtr + dstCapacity - sizeof(bitC->bitContainer);
191*c03c5b1cSMartin Matuska     if (dstCapacity <= sizeof(bitC->bitContainer)) return ERROR(dstSize_tooSmall);
192*c03c5b1cSMartin Matuska     return 0;
193*c03c5b1cSMartin Matuska }
194*c03c5b1cSMartin Matuska 
195*c03c5b1cSMartin Matuska /*! BIT_addBits() :
196*c03c5b1cSMartin Matuska  *  can add up to 31 bits into `bitC`.
197*c03c5b1cSMartin Matuska  *  Note : does not check for register overflow ! */
BIT_addBits(BIT_CStream_t * bitC,size_t value,unsigned nbBits)198*c03c5b1cSMartin Matuska MEM_STATIC void BIT_addBits(BIT_CStream_t* bitC,
199*c03c5b1cSMartin Matuska                             size_t value, unsigned nbBits)
200*c03c5b1cSMartin Matuska {
201*c03c5b1cSMartin Matuska     MEM_STATIC_ASSERT(BIT_MASK_SIZE == 32);
202*c03c5b1cSMartin Matuska     assert(nbBits < BIT_MASK_SIZE);
203*c03c5b1cSMartin Matuska     assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
204*c03c5b1cSMartin Matuska     bitC->bitContainer |= (value & BIT_mask[nbBits]) << bitC->bitPos;
205*c03c5b1cSMartin Matuska     bitC->bitPos += nbBits;
206*c03c5b1cSMartin Matuska }
207*c03c5b1cSMartin Matuska 
208*c03c5b1cSMartin Matuska /*! BIT_addBitsFast() :
209*c03c5b1cSMartin Matuska  *  works only if `value` is _clean_,
210*c03c5b1cSMartin Matuska  *  meaning all high bits above nbBits are 0 */
BIT_addBitsFast(BIT_CStream_t * bitC,size_t value,unsigned nbBits)211*c03c5b1cSMartin Matuska MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC,
212*c03c5b1cSMartin Matuska                                 size_t value, unsigned nbBits)
213*c03c5b1cSMartin Matuska {
214*c03c5b1cSMartin Matuska     assert((value>>nbBits) == 0);
215*c03c5b1cSMartin Matuska     assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
216*c03c5b1cSMartin Matuska     bitC->bitContainer |= value << bitC->bitPos;
217*c03c5b1cSMartin Matuska     bitC->bitPos += nbBits;
218*c03c5b1cSMartin Matuska }
219*c03c5b1cSMartin Matuska 
220*c03c5b1cSMartin Matuska /*! BIT_flushBitsFast() :
221*c03c5b1cSMartin Matuska  *  assumption : bitContainer has not overflowed
222*c03c5b1cSMartin Matuska  *  unsafe version; does not check buffer overflow */
BIT_flushBitsFast(BIT_CStream_t * bitC)223*c03c5b1cSMartin Matuska MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC)
224*c03c5b1cSMartin Matuska {
225*c03c5b1cSMartin Matuska     size_t const nbBytes = bitC->bitPos >> 3;
226*c03c5b1cSMartin Matuska     assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
227*c03c5b1cSMartin Matuska     assert(bitC->ptr <= bitC->endPtr);
228*c03c5b1cSMartin Matuska     MEM_writeLEST(bitC->ptr, bitC->bitContainer);
229*c03c5b1cSMartin Matuska     bitC->ptr += nbBytes;
230*c03c5b1cSMartin Matuska     bitC->bitPos &= 7;
231*c03c5b1cSMartin Matuska     bitC->bitContainer >>= nbBytes*8;
232*c03c5b1cSMartin Matuska }
233*c03c5b1cSMartin Matuska 
234*c03c5b1cSMartin Matuska /*! BIT_flushBits() :
235*c03c5b1cSMartin Matuska  *  assumption : bitContainer has not overflowed
236*c03c5b1cSMartin Matuska  *  safe version; check for buffer overflow, and prevents it.
237*c03c5b1cSMartin Matuska  *  note : does not signal buffer overflow.
238*c03c5b1cSMartin Matuska  *  overflow will be revealed later on using BIT_closeCStream() */
BIT_flushBits(BIT_CStream_t * bitC)239*c03c5b1cSMartin Matuska MEM_STATIC void BIT_flushBits(BIT_CStream_t* bitC)
240*c03c5b1cSMartin Matuska {
241*c03c5b1cSMartin Matuska     size_t const nbBytes = bitC->bitPos >> 3;
242*c03c5b1cSMartin Matuska     assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
243*c03c5b1cSMartin Matuska     assert(bitC->ptr <= bitC->endPtr);
244*c03c5b1cSMartin Matuska     MEM_writeLEST(bitC->ptr, bitC->bitContainer);
245*c03c5b1cSMartin Matuska     bitC->ptr += nbBytes;
246*c03c5b1cSMartin Matuska     if (bitC->ptr > bitC->endPtr) bitC->ptr = bitC->endPtr;
247*c03c5b1cSMartin Matuska     bitC->bitPos &= 7;
248*c03c5b1cSMartin Matuska     bitC->bitContainer >>= nbBytes*8;
249*c03c5b1cSMartin Matuska }
250*c03c5b1cSMartin Matuska 
251*c03c5b1cSMartin Matuska /*! BIT_closeCStream() :
252*c03c5b1cSMartin Matuska  *  @return : size of CStream, in bytes,
253*c03c5b1cSMartin Matuska  *            or 0 if it could not fit into dstBuffer */
BIT_closeCStream(BIT_CStream_t * bitC)254*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC)
255*c03c5b1cSMartin Matuska {
256*c03c5b1cSMartin Matuska     BIT_addBitsFast(bitC, 1, 1);   /* endMark */
257*c03c5b1cSMartin Matuska     BIT_flushBits(bitC);
258*c03c5b1cSMartin Matuska     if (bitC->ptr >= bitC->endPtr) return 0; /* overflow detected */
259*c03c5b1cSMartin Matuska     return (bitC->ptr - bitC->startPtr) + (bitC->bitPos > 0);
260*c03c5b1cSMartin Matuska }
261*c03c5b1cSMartin Matuska 
262*c03c5b1cSMartin Matuska 
263*c03c5b1cSMartin Matuska /*-********************************************************
264*c03c5b1cSMartin Matuska *  bitStream decoding
265*c03c5b1cSMartin Matuska **********************************************************/
266*c03c5b1cSMartin Matuska /*! BIT_initDStream() :
267*c03c5b1cSMartin Matuska  *  Initialize a BIT_DStream_t.
268*c03c5b1cSMartin Matuska  * `bitD` : a pointer to an already allocated BIT_DStream_t structure.
269*c03c5b1cSMartin Matuska  * `srcSize` must be the *exact* size of the bitStream, in bytes.
270*c03c5b1cSMartin Matuska  * @return : size of stream (== srcSize), or an errorCode if a problem is detected
271*c03c5b1cSMartin Matuska  */
BIT_initDStream(BIT_DStream_t * bitD,const void * srcBuffer,size_t srcSize)272*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize)
273*c03c5b1cSMartin Matuska {
274*c03c5b1cSMartin Matuska     if (srcSize < 1) { memset(bitD, 0, sizeof(*bitD)); return ERROR(srcSize_wrong); }
275*c03c5b1cSMartin Matuska 
276*c03c5b1cSMartin Matuska     bitD->start = (const char*)srcBuffer;
277*c03c5b1cSMartin Matuska     bitD->limitPtr = bitD->start + sizeof(bitD->bitContainer);
278*c03c5b1cSMartin Matuska 
279*c03c5b1cSMartin Matuska     if (srcSize >=  sizeof(bitD->bitContainer)) {  /* normal case */
280*c03c5b1cSMartin Matuska         bitD->ptr   = (const char*)srcBuffer + srcSize - sizeof(bitD->bitContainer);
281*c03c5b1cSMartin Matuska         bitD->bitContainer = MEM_readLEST(bitD->ptr);
282*c03c5b1cSMartin Matuska         { BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
283*c03c5b1cSMartin Matuska           bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0;  /* ensures bitsConsumed is always set */
284*c03c5b1cSMartin Matuska           if (lastByte == 0) return ERROR(GENERIC); /* endMark not present */ }
285*c03c5b1cSMartin Matuska     } else {
286*c03c5b1cSMartin Matuska         bitD->ptr   = bitD->start;
287*c03c5b1cSMartin Matuska         bitD->bitContainer = *(const BYTE*)(bitD->start);
288*c03c5b1cSMartin Matuska         switch(srcSize)
289*c03c5b1cSMartin Matuska         {
290*c03c5b1cSMartin Matuska         case 7: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[6]) << (sizeof(bitD->bitContainer)*8 - 16);
291*c03c5b1cSMartin Matuska                 /* fall-through */
292*c03c5b1cSMartin Matuska 
293*c03c5b1cSMartin Matuska         case 6: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[5]) << (sizeof(bitD->bitContainer)*8 - 24);
294*c03c5b1cSMartin Matuska                 /* fall-through */
295*c03c5b1cSMartin Matuska 
296*c03c5b1cSMartin Matuska         case 5: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[4]) << (sizeof(bitD->bitContainer)*8 - 32);
297*c03c5b1cSMartin Matuska                 /* fall-through */
298*c03c5b1cSMartin Matuska 
299*c03c5b1cSMartin Matuska         case 4: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[3]) << 24;
300*c03c5b1cSMartin Matuska                 /* fall-through */
301*c03c5b1cSMartin Matuska 
302*c03c5b1cSMartin Matuska         case 3: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[2]) << 16;
303*c03c5b1cSMartin Matuska                 /* fall-through */
304*c03c5b1cSMartin Matuska 
305*c03c5b1cSMartin Matuska         case 2: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[1]) <<  8;
306*c03c5b1cSMartin Matuska                 /* fall-through */
307*c03c5b1cSMartin Matuska 
308*c03c5b1cSMartin Matuska         default: break;
309*c03c5b1cSMartin Matuska         }
310*c03c5b1cSMartin Matuska         {   BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
311*c03c5b1cSMartin Matuska             bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0;
312*c03c5b1cSMartin Matuska             if (lastByte == 0) return ERROR(corruption_detected);  /* endMark not present */
313*c03c5b1cSMartin Matuska         }
314*c03c5b1cSMartin Matuska         bitD->bitsConsumed += (U32)(sizeof(bitD->bitContainer) - srcSize)*8;
315*c03c5b1cSMartin Matuska     }
316*c03c5b1cSMartin Matuska 
317*c03c5b1cSMartin Matuska     return srcSize;
318*c03c5b1cSMartin Matuska }
319*c03c5b1cSMartin Matuska 
BIT_getUpperBits(size_t bitContainer,U32 const start)320*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_getUpperBits(size_t bitContainer, U32 const start)
321*c03c5b1cSMartin Matuska {
322*c03c5b1cSMartin Matuska     return bitContainer >> start;
323*c03c5b1cSMartin Matuska }
324*c03c5b1cSMartin Matuska 
BIT_getMiddleBits(size_t bitContainer,U32 const start,U32 const nbBits)325*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_getMiddleBits(size_t bitContainer, U32 const start, U32 const nbBits)
326*c03c5b1cSMartin Matuska {
327*c03c5b1cSMartin Matuska     U32 const regMask = sizeof(bitContainer)*8 - 1;
328*c03c5b1cSMartin Matuska     /* if start > regMask, bitstream is corrupted, and result is undefined */
329*c03c5b1cSMartin Matuska     assert(nbBits < BIT_MASK_SIZE);
330*c03c5b1cSMartin Matuska     return (bitContainer >> (start & regMask)) & BIT_mask[nbBits];
331*c03c5b1cSMartin Matuska }
332*c03c5b1cSMartin Matuska 
BIT_getLowerBits(size_t bitContainer,U32 const nbBits)333*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_getLowerBits(size_t bitContainer, U32 const nbBits)
334*c03c5b1cSMartin Matuska {
335*c03c5b1cSMartin Matuska     assert(nbBits < BIT_MASK_SIZE);
336*c03c5b1cSMartin Matuska     return bitContainer & BIT_mask[nbBits];
337*c03c5b1cSMartin Matuska }
338*c03c5b1cSMartin Matuska 
339*c03c5b1cSMartin Matuska /*! BIT_lookBits() :
340*c03c5b1cSMartin Matuska  *  Provides next n bits from local register.
341*c03c5b1cSMartin Matuska  *  local register is not modified.
342*c03c5b1cSMartin Matuska  *  On 32-bits, maxNbBits==24.
343*c03c5b1cSMartin Matuska  *  On 64-bits, maxNbBits==56.
344*c03c5b1cSMartin Matuska  * @return : value extracted */
BIT_lookBits(const BIT_DStream_t * bitD,U32 nbBits)345*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_lookBits(const BIT_DStream_t* bitD, U32 nbBits)
346*c03c5b1cSMartin Matuska {
347*c03c5b1cSMartin Matuska     /* arbitrate between double-shift and shift+mask */
348*c03c5b1cSMartin Matuska #if 1
349*c03c5b1cSMartin Matuska     /* if bitD->bitsConsumed + nbBits > sizeof(bitD->bitContainer)*8,
350*c03c5b1cSMartin Matuska      * bitstream is likely corrupted, and result is undefined */
351*c03c5b1cSMartin Matuska     return BIT_getMiddleBits(bitD->bitContainer, (sizeof(bitD->bitContainer)*8) - bitD->bitsConsumed - nbBits, nbBits);
352*c03c5b1cSMartin Matuska #else
353*c03c5b1cSMartin Matuska     /* this code path is slower on my os-x laptop */
354*c03c5b1cSMartin Matuska     U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
355*c03c5b1cSMartin Matuska     return ((bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> 1) >> ((regMask-nbBits) & regMask);
356*c03c5b1cSMartin Matuska #endif
357*c03c5b1cSMartin Matuska }
358*c03c5b1cSMartin Matuska 
359*c03c5b1cSMartin Matuska /*! BIT_lookBitsFast() :
360*c03c5b1cSMartin Matuska  *  unsafe version; only works if nbBits >= 1 */
BIT_lookBitsFast(const BIT_DStream_t * bitD,U32 nbBits)361*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_lookBitsFast(const BIT_DStream_t* bitD, U32 nbBits)
362*c03c5b1cSMartin Matuska {
363*c03c5b1cSMartin Matuska     U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
364*c03c5b1cSMartin Matuska     assert(nbBits >= 1);
365*c03c5b1cSMartin Matuska     return (bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> (((regMask+1)-nbBits) & regMask);
366*c03c5b1cSMartin Matuska }
367*c03c5b1cSMartin Matuska 
BIT_skipBits(BIT_DStream_t * bitD,U32 nbBits)368*c03c5b1cSMartin Matuska MEM_STATIC void BIT_skipBits(BIT_DStream_t* bitD, U32 nbBits)
369*c03c5b1cSMartin Matuska {
370*c03c5b1cSMartin Matuska     bitD->bitsConsumed += nbBits;
371*c03c5b1cSMartin Matuska }
372*c03c5b1cSMartin Matuska 
373*c03c5b1cSMartin Matuska /*! BIT_readBits() :
374*c03c5b1cSMartin Matuska  *  Read (consume) next n bits from local register and update.
375*c03c5b1cSMartin Matuska  *  Pay attention to not read more than nbBits contained into local register.
376*c03c5b1cSMartin Matuska  * @return : extracted value. */
BIT_readBits(BIT_DStream_t * bitD,unsigned nbBits)377*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits)
378*c03c5b1cSMartin Matuska {
379*c03c5b1cSMartin Matuska     size_t const value = BIT_lookBits(bitD, nbBits);
380*c03c5b1cSMartin Matuska     BIT_skipBits(bitD, nbBits);
381*c03c5b1cSMartin Matuska     return value;
382*c03c5b1cSMartin Matuska }
383*c03c5b1cSMartin Matuska 
384*c03c5b1cSMartin Matuska /*! BIT_readBitsFast() :
385*c03c5b1cSMartin Matuska  *  unsafe version; only works only if nbBits >= 1 */
BIT_readBitsFast(BIT_DStream_t * bitD,unsigned nbBits)386*c03c5b1cSMartin Matuska MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits)
387*c03c5b1cSMartin Matuska {
388*c03c5b1cSMartin Matuska     size_t const value = BIT_lookBitsFast(bitD, nbBits);
389*c03c5b1cSMartin Matuska     assert(nbBits >= 1);
390*c03c5b1cSMartin Matuska     BIT_skipBits(bitD, nbBits);
391*c03c5b1cSMartin Matuska     return value;
392*c03c5b1cSMartin Matuska }
393*c03c5b1cSMartin Matuska 
394*c03c5b1cSMartin Matuska /*! BIT_reloadDStreamFast() :
395*c03c5b1cSMartin Matuska  *  Similar to BIT_reloadDStream(), but with two differences:
396*c03c5b1cSMartin Matuska  *  1. bitsConsumed <= sizeof(bitD->bitContainer)*8 must hold!
397*c03c5b1cSMartin Matuska  *  2. Returns BIT_DStream_overflow when bitD->ptr < bitD->limitPtr, at this
398*c03c5b1cSMartin Matuska  *     point you must use BIT_reloadDStream() to reload.
399*c03c5b1cSMartin Matuska  */
BIT_reloadDStreamFast(BIT_DStream_t * bitD)400*c03c5b1cSMartin Matuska MEM_STATIC BIT_DStream_status BIT_reloadDStreamFast(BIT_DStream_t* bitD)
401*c03c5b1cSMartin Matuska {
402*c03c5b1cSMartin Matuska     if (UNLIKELY(bitD->ptr < bitD->limitPtr))
403*c03c5b1cSMartin Matuska         return BIT_DStream_overflow;
404*c03c5b1cSMartin Matuska     assert(bitD->bitsConsumed <= sizeof(bitD->bitContainer)*8);
405*c03c5b1cSMartin Matuska     bitD->ptr -= bitD->bitsConsumed >> 3;
406*c03c5b1cSMartin Matuska     bitD->bitsConsumed &= 7;
407*c03c5b1cSMartin Matuska     bitD->bitContainer = MEM_readLEST(bitD->ptr);
408*c03c5b1cSMartin Matuska     return BIT_DStream_unfinished;
409*c03c5b1cSMartin Matuska }
410*c03c5b1cSMartin Matuska 
411*c03c5b1cSMartin Matuska /*! BIT_reloadDStream() :
412*c03c5b1cSMartin Matuska  *  Refill `bitD` from buffer previously set in BIT_initDStream() .
413*c03c5b1cSMartin Matuska  *  This function is safe, it guarantees it will not read beyond src buffer.
414*c03c5b1cSMartin Matuska  * @return : status of `BIT_DStream_t` internal register.
415*c03c5b1cSMartin Matuska  *           when status == BIT_DStream_unfinished, internal register is filled with at least 25 or 57 bits */
BIT_reloadDStream(BIT_DStream_t * bitD)416*c03c5b1cSMartin Matuska MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD)
417*c03c5b1cSMartin Matuska {
418*c03c5b1cSMartin Matuska     if (bitD->bitsConsumed > (sizeof(bitD->bitContainer)*8))  /* overflow detected, like end of stream */
419*c03c5b1cSMartin Matuska         return BIT_DStream_overflow;
420*c03c5b1cSMartin Matuska 
421*c03c5b1cSMartin Matuska     if (bitD->ptr >= bitD->limitPtr) {
422*c03c5b1cSMartin Matuska         return BIT_reloadDStreamFast(bitD);
423*c03c5b1cSMartin Matuska     }
424*c03c5b1cSMartin Matuska     if (bitD->ptr == bitD->start) {
425*c03c5b1cSMartin Matuska         if (bitD->bitsConsumed < sizeof(bitD->bitContainer)*8) return BIT_DStream_endOfBuffer;
426*c03c5b1cSMartin Matuska         return BIT_DStream_completed;
427*c03c5b1cSMartin Matuska     }
428*c03c5b1cSMartin Matuska     /* start < ptr < limitPtr */
429*c03c5b1cSMartin Matuska     {   U32 nbBytes = bitD->bitsConsumed >> 3;
430*c03c5b1cSMartin Matuska         BIT_DStream_status result = BIT_DStream_unfinished;
431*c03c5b1cSMartin Matuska         if (bitD->ptr - nbBytes < bitD->start) {
432*c03c5b1cSMartin Matuska             nbBytes = (U32)(bitD->ptr - bitD->start);  /* ptr > start */
433*c03c5b1cSMartin Matuska             result = BIT_DStream_endOfBuffer;
434*c03c5b1cSMartin Matuska         }
435*c03c5b1cSMartin Matuska         bitD->ptr -= nbBytes;
436*c03c5b1cSMartin Matuska         bitD->bitsConsumed -= nbBytes*8;
437*c03c5b1cSMartin Matuska         bitD->bitContainer = MEM_readLEST(bitD->ptr);   /* reminder : srcSize > sizeof(bitD->bitContainer), otherwise bitD->ptr == bitD->start */
438*c03c5b1cSMartin Matuska         return result;
439*c03c5b1cSMartin Matuska     }
440*c03c5b1cSMartin Matuska }
441*c03c5b1cSMartin Matuska 
442*c03c5b1cSMartin Matuska /*! BIT_endOfDStream() :
443*c03c5b1cSMartin Matuska  * @return : 1 if DStream has _exactly_ reached its end (all bits consumed).
444*c03c5b1cSMartin Matuska  */
BIT_endOfDStream(const BIT_DStream_t * DStream)445*c03c5b1cSMartin Matuska MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* DStream)
446*c03c5b1cSMartin Matuska {
447*c03c5b1cSMartin Matuska     return ((DStream->ptr == DStream->start) && (DStream->bitsConsumed == sizeof(DStream->bitContainer)*8));
448*c03c5b1cSMartin Matuska }
449*c03c5b1cSMartin Matuska 
450*c03c5b1cSMartin Matuska #if defined (__cplusplus)
451*c03c5b1cSMartin Matuska }
452*c03c5b1cSMartin Matuska #endif
453*c03c5b1cSMartin Matuska 
454*c03c5b1cSMartin Matuska #endif /* BITSTREAM_H_MODULE */
455