blob: 2f91460c5eb0a0e319c8f0b91e4f8e041ff59da5 [file] [log] [blame]
Yann Colletb1f3f4b2015-10-18 22:18:32 +01001/* ******************************************************************
2 bitstream
Yann Colletae7aa062016-02-03 02:46:46 +01003 Part of FSE library
Yann Colletfa41bcc2018-06-13 14:59:26 -04004 Copyright (C) 2013-present, Yann Collet.
Yann Colletb1f3f4b2015-10-18 22:18:32 +01005
6 BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
7
8 Redistribution and use in source and binary forms, with or without
9 modification, are permitted provided that the following conditions are
10 met:
11
12 * Redistributions of source code must retain the above copyright
13 notice, this list of conditions and the following disclaimer.
14 * Redistributions in binary form must reproduce the above
15 copyright notice, this list of conditions and the following disclaimer
16 in the documentation and/or other materials provided with the
17 distribution.
18
19 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20 "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21 LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22 A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23 OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25 LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26 DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27 THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29 OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
31 You can contact the author at :
32 - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
Yann Colletb1f3f4b2015-10-18 22:18:32 +010033****************************************************************** */
34#ifndef BITSTREAM_H_MODULE
35#define BITSTREAM_H_MODULE
36
37#if defined (__cplusplus)
38extern "C" {
39#endif
40
Yann Colletb1f3f4b2015-10-18 22:18:32 +010041/*
Yann Collet01e5b952016-03-19 14:14:31 +010042* This API consists of small unitary functions, which must be inlined for best performance.
Yann Colletb1f3f4b2015-10-18 22:18:32 +010043* Since link-time-optimization is not available for all compilers,
44* these functions are defined into a .h to be included.
45*/
46
Yann Colletae7aa062016-02-03 02:46:46 +010047/*-****************************************
48* Dependencies
Yann Colletb1f3f4b2015-10-18 22:18:32 +010049******************************************/
Yann Collet977f1f32016-01-21 15:38:47 +010050#include "mem.h" /* unaligned access routines */
Yann Colletfa41bcc2018-06-13 14:59:26 -040051#include "debug.h" /* assert(), DEBUGLOG(), RAWLOG() */
Yann Collet977f1f32016-01-21 15:38:47 +010052#include "error_private.h" /* error codes and messages */
Yann Colletb1f3f4b2015-10-18 22:18:32 +010053
54
Yann Collet74bd1192016-03-26 17:50:26 +010055/*=========================================
56* Target specific
57=========================================*/
58#if defined(__BMI__) && defined(__GNUC__)
59# include <immintrin.h> /* support for bextr (experimental) */
60#endif
61
/* Minimum number of bits available in the local register after a reload
 * that returned BIT_DStream_unfinished : (8 * register size) - 7,
 * i.e. 25 bits for a 32-bit register and 57 bits for a 64-bit register.
 * STREAM_ACCUMULATOR_MIN selects the value matching the current target. */
#define STREAM_ACCUMULATOR_MIN_32  25
#define STREAM_ACCUMULATOR_MIN_64  57
#define STREAM_ACCUMULATOR_MIN    ((U32)(MEM_32bits() ? STREAM_ACCUMULATOR_MIN_32 : STREAM_ACCUMULATOR_MIN_64))
Yann Collet74bd1192016-03-26 17:50:26 +010065
Yann Collet8c910d22017-06-03 01:15:02 -070066
Yann Colletae7aa062016-02-03 02:46:46 +010067/*-******************************************
68* bitStream encoding API (write forward)
Yann Colletb1f3f4b2015-10-18 22:18:32 +010069********************************************/
Yann Colletd1d210f2016-03-19 12:12:07 +010070/* bitStream can mix input from multiple sources.
Yann Colletb71363b2017-07-19 01:05:40 -070071 * A critical property of these streams is that they encode and decode in **reverse** direction.
72 * So the first bit sequence you add will be the last to be read, like a LIFO stack.
73 */
typedef struct {
    size_t   bitContainer;   /* local accumulator : bits are OR-ed in here, then flushed to memory */
    unsigned bitPos;         /* nb of bits currently stored in bitContainer */
    char*    startPtr;       /* beginning of destination buffer */
    char*    ptr;            /* next write position within destination buffer */
    char*    endPtr;         /* startPtr + dstCapacity - sizeof(bitContainer) : write position is clamped here */
} BIT_CStream_t;
81
Yann Colletae7aa062016-02-03 02:46:46 +010082MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC, void* dstBuffer, size_t dstCapacity);
Yann Colletb1f3f4b2015-10-18 22:18:32 +010083MEM_STATIC void BIT_addBits(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
84MEM_STATIC void BIT_flushBits(BIT_CStream_t* bitC);
85MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC);
86
Yann Collet01e5b952016-03-19 14:14:31 +010087/* Start with initCStream, providing the size of buffer to write into.
88* bitStream will never write outside of this buffer.
* `dstCapacity` must be > sizeof(bitC->bitContainer), otherwise @return will be an error code.
Yann Colletb1f3f4b2015-10-18 22:18:32 +010090*
Yann Collet01e5b952016-03-19 14:14:31 +010091* bits are first added to a local register.
92* Local register is size_t, hence 64-bits on 64-bits systems, or 32-bits on 32-bits systems.
93* Writing data into memory is an explicit operation, performed by the flushBits function.
94* Hence keep track how many bits are potentially stored into local register to avoid register overflow.
95* After a flushBits, a maximum of 7 bits might still be stored into local register.
Yann Colletb1f3f4b2015-10-18 22:18:32 +010096*
Yann Collet01e5b952016-03-19 14:14:31 +010097* Avoid storing elements of more than 24 bits if you want compatibility with 32-bits bitstream readers.
Yann Colletb1f3f4b2015-10-18 22:18:32 +010098*
Yann Collet01e5b952016-03-19 14:14:31 +010099* Last operation is to close the bitStream.
100* The function returns the final size of CStream in bytes.
101* If data couldn't fit into `dstBuffer`, it will return a 0 ( == not storable)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100102*/
103
104
Yann Colletae7aa062016-02-03 02:46:46 +0100105/*-********************************************
106* bitStream decoding API (read backward)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100107**********************************************/
typedef struct {
    size_t      bitContainer;   /* local register : holds the chunk of bitStream currently being decoded */
    unsigned    bitsConsumed;   /* nb of bits of bitContainer already read */
    const char* ptr;            /* position within source buffer from which bitContainer was loaded */
    const char* start;          /* beginning of source buffer */
    const char* limitPtr;       /* start + sizeof(bitContainer) : at or above it, a reload can always move back freely */
} BIT_DStream_t;
115
/* result of BIT_reloadDStream() */
typedef enum {
    BIT_DStream_unfinished  = 0,
    BIT_DStream_endOfBuffer = 1,
    BIT_DStream_completed   = 2,
    BIT_DStream_overflow    = 3
} BIT_DStream_status;
/* note : 1,2,4,8 would be better for bitmap combinations, but slows down performance a bit ... :( */
121
122MEM_STATIC size_t BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize);
123MEM_STATIC size_t BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits);
124MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD);
125MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* bitD);
126
127
Yann Collet01e5b952016-03-19 14:14:31 +0100128/* Start by invoking BIT_initDStream().
129* A chunk of the bitStream is then stored into a local register.
130* Local register size is 64-bits on 64-bits systems, 32-bits on 32-bits systems (size_t).
131* You can then retrieve bitFields stored into the local register, **in reverse order**.
132* Local register is explicitly reloaded from memory by the BIT_reloadDStream() method.
* A reload guarantees a minimum of ((8*sizeof(bitD->bitContainer))-7) bits when its result is BIT_DStream_unfinished.
Yann Collet01e5b952016-03-19 14:14:31 +0100134* Otherwise, it can be less than that, so proceed accordingly.
Yann Colletb21ce152016-03-24 01:27:55 +0100135* Checking if DStream has reached its end can be performed with BIT_endOfDStream().
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100136*/
137
138
Yann Colletae7aa062016-02-03 02:46:46 +0100139/*-****************************************
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100140* unsafe API
141******************************************/
142MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
143/* faster, but works only if value is "clean", meaning all high bits above nbBits are 0 */
144
145MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC);
146/* unsafe version; does not check buffer overflow */
147
148MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits);
149/* faster, but works only if nbBits >= 1 */
150
151
152
Yann Colletae7aa062016-02-03 02:46:46 +0100153/*-**************************************************************
Yann Collet6cf45da2016-03-23 14:18:37 +0100154* Internal functions
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100155****************************************************************/
Yann Colletc173dbd2017-12-04 17:57:42 -0800156MEM_STATIC unsigned BIT_highbit32 (U32 val)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100157{
Stella Laue50ed1f2017-08-22 11:55:42 -0700158 assert(val != 0);
159 {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100160# if defined(_MSC_VER) /* Visual */
Stella Laue50ed1f2017-08-22 11:55:42 -0700161 unsigned long r=0;
162 _BitScanReverse ( &r, val );
163 return (unsigned) r;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100164# elif defined(__GNUC__) && (__GNUC__ >= 3) /* Use GCC Intrinsic */
Stella Laue50ed1f2017-08-22 11:55:42 -0700165 return 31 - __builtin_clz (val);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100166# else /* Software version */
Stella Laue50ed1f2017-08-22 11:55:42 -0700167 static const unsigned DeBruijnClz[32] = { 0, 9, 1, 10, 13, 21, 2, 29,
168 11, 14, 16, 18, 22, 25, 3, 30,
169 8, 12, 20, 28, 15, 17, 24, 7,
170 19, 27, 23, 6, 26, 5, 4, 31 };
171 U32 v = val;
172 v |= v >> 1;
173 v |= v >> 2;
174 v |= v >> 4;
175 v |= v >> 8;
176 v |= v >> 16;
177 return DeBruijnClz[ (U32) (v * 0x07C4ACDDU) >> 27];
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100178# endif
Stella Laue50ed1f2017-08-22 11:55:42 -0700179 }
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100180}
181
Yann Collet6cf45da2016-03-23 14:18:37 +0100182/*===== Local Constants =====*/
/* BIT_mask[n] has its n lowest bits set, for n in [0, 31] */
static const unsigned BIT_mask[] = {
    0x00000000, 0x00000001, 0x00000003, 0x00000007,
    0x0000000F, 0x0000001F, 0x0000003F, 0x0000007F,
    0x000000FF, 0x000001FF, 0x000003FF, 0x000007FF,
    0x00000FFF, 0x00001FFF, 0x00003FFF, 0x00007FFF,
    0x0000FFFF, 0x0001FFFF, 0x0003FFFF, 0x0007FFFF,
    0x000FFFFF, 0x001FFFFF, 0x003FFFFF, 0x007FFFFF,
    0x00FFFFFF, 0x01FFFFFF, 0x03FFFFFF, 0x07FFFFFF,
    0x0FFFFFFF, 0x1FFFFFFF, 0x3FFFFFFF, 0x7FFFFFFF
};   /* up to 31 bits */
#define BIT_MASK_SIZE (sizeof(BIT_mask) / sizeof(BIT_mask[0]))
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100191
Yann Colletae7aa062016-02-03 02:46:46 +0100192/*-**************************************************************
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100193* bitStream encoding
194****************************************************************/
Yann Collet01e5b952016-03-19 14:14:31 +0100195/*! BIT_initCStream() :
Yann Colletf39a6732017-05-01 09:56:03 -0700196 * `dstCapacity` must be > sizeof(size_t)
Yann Collet01e5b952016-03-19 14:14:31 +0100197 * @return : 0 if success,
Yann Colletb71363b2017-07-19 01:05:40 -0700198 * otherwise an error code (can be tested using ERR_isError()) */
Yann Colletf39a6732017-05-01 09:56:03 -0700199MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC,
Yann Collet33c38b02017-05-01 11:12:30 -0700200 void* startPtr, size_t dstCapacity)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100201{
202 bitC->bitContainer = 0;
203 bitC->bitPos = 0;
204 bitC->startPtr = (char*)startPtr;
205 bitC->ptr = bitC->startPtr;
Yann Colletf39a6732017-05-01 09:56:03 -0700206 bitC->endPtr = bitC->startPtr + dstCapacity - sizeof(bitC->bitContainer);
207 if (dstCapacity <= sizeof(bitC->bitContainer)) return ERROR(dstSize_tooSmall);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100208 return 0;
209}
210
Yann Collet01e5b952016-03-19 14:14:31 +0100211/*! BIT_addBits() :
Nick Terrell74718d72017-09-15 17:44:09 -0700212 * can add up to 31 bits into `bitC`.
Yann Colletb71363b2017-07-19 01:05:40 -0700213 * Note : does not check for register overflow ! */
Yann Colletf39a6732017-05-01 09:56:03 -0700214MEM_STATIC void BIT_addBits(BIT_CStream_t* bitC,
Yann Collet33c38b02017-05-01 11:12:30 -0700215 size_t value, unsigned nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100216{
Nick Terrell74718d72017-09-15 17:44:09 -0700217 MEM_STATIC_ASSERT(BIT_MASK_SIZE == 32);
218 assert(nbBits < BIT_MASK_SIZE);
219 assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Yann Collet6cf45da2016-03-23 14:18:37 +0100220 bitC->bitContainer |= (value & BIT_mask[nbBits]) << bitC->bitPos;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100221 bitC->bitPos += nbBits;
222}
223
Yann Colletd1d210f2016-03-19 12:12:07 +0100224/*! BIT_addBitsFast() :
Yann Colletfa41bcc2018-06-13 14:59:26 -0400225 * works only if `value` is _clean_,
226 * meaning all high bits above nbBits are 0 */
Yann Colletf39a6732017-05-01 09:56:03 -0700227MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC,
Yann Collet33c38b02017-05-01 11:12:30 -0700228 size_t value, unsigned nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100229{
Yann Collet202082f2017-04-28 16:56:39 -0700230 assert((value>>nbBits) == 0);
Nick Terrell74718d72017-09-15 17:44:09 -0700231 assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100232 bitC->bitContainer |= value << bitC->bitPos;
233 bitC->bitPos += nbBits;
234}
235
Yann Colletd1d210f2016-03-19 12:12:07 +0100236/*! BIT_flushBitsFast() :
Yann Colletf39a6732017-05-01 09:56:03 -0700237 * assumption : bitContainer has not overflowed
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100238 * unsafe version; does not check buffer overflow */
239MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC)
240{
Yann Colletd64f4352016-03-21 00:07:42 +0100241 size_t const nbBytes = bitC->bitPos >> 3;
Nick Terrell74718d72017-09-15 17:44:09 -0700242 assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100243 MEM_writeLEST(bitC->ptr, bitC->bitContainer);
244 bitC->ptr += nbBytes;
Yann Colletf39a6732017-05-01 09:56:03 -0700245 assert(bitC->ptr <= bitC->endPtr);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100246 bitC->bitPos &= 7;
Yann Colletf39a6732017-05-01 09:56:03 -0700247 bitC->bitContainer >>= nbBytes*8;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100248}
249
Yann Collet01e5b952016-03-19 14:14:31 +0100250/*! BIT_flushBits() :
Yann Colletf39a6732017-05-01 09:56:03 -0700251 * assumption : bitContainer has not overflowed
Yann Collet01e5b952016-03-19 14:14:31 +0100252 * safe version; check for buffer overflow, and prevents it.
Yann Collet33c38b02017-05-01 11:12:30 -0700253 * note : does not signal buffer overflow.
254 * overflow will be revealed later on using BIT_closeCStream() */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100255MEM_STATIC void BIT_flushBits(BIT_CStream_t* bitC)
256{
Yann Colletd64f4352016-03-21 00:07:42 +0100257 size_t const nbBytes = bitC->bitPos >> 3;
Nick Terrell74718d72017-09-15 17:44:09 -0700258 assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100259 MEM_writeLEST(bitC->ptr, bitC->bitContainer);
260 bitC->ptr += nbBytes;
261 if (bitC->ptr > bitC->endPtr) bitC->ptr = bitC->endPtr;
262 bitC->bitPos &= 7;
Yann Collet33c38b02017-05-01 11:12:30 -0700263 bitC->bitContainer >>= nbBytes*8;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100264}
265
Yann Colletd1d210f2016-03-19 12:12:07 +0100266/*! BIT_closeCStream() :
Yann Collet01e5b952016-03-19 14:14:31 +0100267 * @return : size of CStream, in bytes,
Yann Colletb71363b2017-07-19 01:05:40 -0700268 * or 0 if it could not fit into dstBuffer */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100269MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC)
270{
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100271 BIT_addBitsFast(bitC, 1, 1); /* endMark */
272 BIT_flushBits(bitC);
Yann Collet33c38b02017-05-01 11:12:30 -0700273 if (bitC->ptr >= bitC->endPtr) return 0; /* overflow detected */
Yann Collet01e5b952016-03-19 14:14:31 +0100274 return (bitC->ptr - bitC->startPtr) + (bitC->bitPos > 0);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100275}
276
277
Yann Colletae7aa062016-02-03 02:46:46 +0100278/*-********************************************************
Yann Colletb71363b2017-07-19 01:05:40 -0700279* bitStream decoding
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100280**********************************************************/
Yann Collet01e5b952016-03-19 14:14:31 +0100281/*! BIT_initDStream() :
Yann Colletb71363b2017-07-19 01:05:40 -0700282 * Initialize a BIT_DStream_t.
283 * `bitD` : a pointer to an already allocated BIT_DStream_t structure.
284 * `srcSize` must be the *exact* size of the bitStream, in bytes.
285 * @return : size of stream (== srcSize), or an errorCode if a problem is detected
286 */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100287MEM_STATIC size_t BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize)
288{
289 if (srcSize < 1) { memset(bitD, 0, sizeof(*bitD)); return ERROR(srcSize_wrong); }
290
Yann Colletf39a6732017-05-01 09:56:03 -0700291 bitD->start = (const char*)srcBuffer;
292 bitD->limitPtr = bitD->start + sizeof(bitD->bitContainer);
293
Yann Collet1032fbe2016-05-11 18:30:24 +0200294 if (srcSize >= sizeof(bitD->bitContainer)) { /* normal case */
Yann Collet1032fbe2016-05-11 18:30:24 +0200295 bitD->ptr = (const char*)srcBuffer + srcSize - sizeof(bitD->bitContainer);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100296 bitD->bitContainer = MEM_readLEST(bitD->ptr);
Yann Colletb21ce152016-03-24 01:27:55 +0100297 { BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
Yann Collet5397a662016-12-13 15:21:06 +0100298 bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0; /* ensures bitsConsumed is always set */
Yann Collet18c8f792016-06-12 22:51:52 +0200299 if (lastByte == 0) return ERROR(GENERIC); /* endMark not present */ }
Yann Colletae7aa062016-02-03 02:46:46 +0100300 } else {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100301 bitD->ptr = bitD->start;
Yann Collet1ceb5a92016-05-12 13:50:13 +0200302 bitD->bitContainer = *(const BYTE*)(bitD->start);
303 switch(srcSize)
304 {
Yann Colletb71363b2017-07-19 01:05:40 -0700305 case 7: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[6]) << (sizeof(bitD->bitContainer)*8 - 16);
306 /* fall-through */
Jos Collin05286fd2017-05-09 08:36:05 +0530307
Yann Colletb71363b2017-07-19 01:05:40 -0700308 case 6: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[5]) << (sizeof(bitD->bitContainer)*8 - 24);
309 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700310
Yann Colletb71363b2017-07-19 01:05:40 -0700311 case 5: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[4]) << (sizeof(bitD->bitContainer)*8 - 32);
312 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700313
Yann Colletb71363b2017-07-19 01:05:40 -0700314 case 4: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[3]) << 24;
315 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700316
Yann Colletb71363b2017-07-19 01:05:40 -0700317 case 3: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[2]) << 16;
318 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700319
Yann Colletb71363b2017-07-19 01:05:40 -0700320 case 2: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[1]) << 8;
321 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700322
Yann Colletb71363b2017-07-19 01:05:40 -0700323 default: break;
Yann Collet1ceb5a92016-05-12 13:50:13 +0200324 }
Yann Colletb71363b2017-07-19 01:05:40 -0700325 { BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
326 bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0;
327 if (lastByte == 0) return ERROR(corruption_detected); /* endMark not present */
328 }
Yann Collet1032fbe2016-05-11 18:30:24 +0200329 bitD->bitsConsumed += (U32)(sizeof(bitD->bitContainer) - srcSize)*8;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100330 }
331
332 return srcSize;
333}
334
Yann Collet1032fbe2016-05-11 18:30:24 +0200335MEM_STATIC size_t BIT_getUpperBits(size_t bitContainer, U32 const start)
Yann Collet3c017862016-03-23 14:09:51 +0100336{
Yann Collet1032fbe2016-05-11 18:30:24 +0200337 return bitContainer >> start;
Yann Collet3c017862016-03-23 14:09:51 +0100338}
339
Yann Collet1032fbe2016-05-11 18:30:24 +0200340MEM_STATIC size_t BIT_getMiddleBits(size_t bitContainer, U32 const start, U32 const nbBits)
Yann Collet3c017862016-03-23 14:09:51 +0100341{
Yann Collet5397a662016-12-13 15:21:06 +0100342#if defined(__BMI__) && defined(__GNUC__) && __GNUC__*1000+__GNUC_MINOR__ >= 4008 /* experimental */
Yann Collet6f9c0562016-05-01 10:26:30 +0200343# if defined(__x86_64__)
Yann Collet1032fbe2016-05-11 18:30:24 +0200344 if (sizeof(bitContainer)==8)
345 return _bextr_u64(bitContainer, start, nbBits);
Yann Collet6f9c0562016-05-01 10:26:30 +0200346 else
347# endif
Yann Collet1032fbe2016-05-11 18:30:24 +0200348 return _bextr_u32(bitContainer, start, nbBits);
Yann Collet862a8592016-03-23 18:45:23 +0100349#else
Nick Terrell74718d72017-09-15 17:44:09 -0700350 assert(nbBits < BIT_MASK_SIZE);
Yann Collet1032fbe2016-05-11 18:30:24 +0200351 return (bitContainer >> start) & BIT_mask[nbBits];
Yann Collet862a8592016-03-23 18:45:23 +0100352#endif
Yann Collet3c017862016-03-23 14:09:51 +0100353}
354
Yann Collet1032fbe2016-05-11 18:30:24 +0200355MEM_STATIC size_t BIT_getLowerBits(size_t bitContainer, U32 const nbBits)
Yann Colletafab0202016-03-23 13:57:49 +0100356{
Nick Terrell74718d72017-09-15 17:44:09 -0700357 assert(nbBits < BIT_MASK_SIZE);
Yann Collet1032fbe2016-05-11 18:30:24 +0200358 return bitContainer & BIT_mask[nbBits];
Yann Colletafab0202016-03-23 13:57:49 +0100359}
360
Yann Collet01e5b952016-03-19 14:14:31 +0100361/*! BIT_lookBits() :
362 * Provides next n bits from local register.
Yann Collet1032fbe2016-05-11 18:30:24 +0200363 * local register is not modified.
Yann Collet01e5b952016-03-19 14:14:31 +0100364 * On 32-bits, maxNbBits==24.
365 * On 64-bits, maxNbBits==56.
Yann Colletb71363b2017-07-19 01:05:40 -0700366 * @return : value extracted */
367MEM_STATIC size_t BIT_lookBits(const BIT_DStream_t* bitD, U32 nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100368{
Yann Collet1032fbe2016-05-11 18:30:24 +0200369#if defined(__BMI__) && defined(__GNUC__) /* experimental; fails if bitD->bitsConsumed + nbBits > sizeof(bitD->bitContainer)*8 */
370 return BIT_getMiddleBits(bitD->bitContainer, (sizeof(bitD->bitContainer)*8) - bitD->bitsConsumed - nbBits, nbBits);
Yann Collet862a8592016-03-23 18:45:23 +0100371#else
Yann Colletf39a6732017-05-01 09:56:03 -0700372 U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
373 return ((bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> 1) >> ((regMask-nbBits) & regMask);
Yann Collet862a8592016-03-23 18:45:23 +0100374#endif
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100375}
376
Yann Collet01e5b952016-03-19 14:14:31 +0100377/*! BIT_lookBitsFast() :
Yann Collet202082f2017-04-28 16:56:39 -0700378 * unsafe version; only works if nbBits >= 1 */
Yann Colletadd08d62016-03-23 01:32:41 +0100379MEM_STATIC size_t BIT_lookBitsFast(const BIT_DStream_t* bitD, U32 nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100380{
Yann Colletf39a6732017-05-01 09:56:03 -0700381 U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
Yann Collet202082f2017-04-28 16:56:39 -0700382 assert(nbBits >= 1);
Yann Colletf39a6732017-05-01 09:56:03 -0700383 return (bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> (((regMask+1)-nbBits) & regMask);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100384}
385
386MEM_STATIC void BIT_skipBits(BIT_DStream_t* bitD, U32 nbBits)
387{
388 bitD->bitsConsumed += nbBits;
389}
390
Yann Collet01e5b952016-03-19 14:14:31 +0100391/*! BIT_readBits() :
Yann Colletb21ce152016-03-24 01:27:55 +0100392 * Read (consume) next n bits from local register and update.
393 * Pay attention to not read more than nbBits contained into local register.
Yann Colletb71363b2017-07-19 01:05:40 -0700394 * @return : extracted value. */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100395MEM_STATIC size_t BIT_readBits(BIT_DStream_t* bitD, U32 nbBits)
396{
Yann Colletafab0202016-03-23 13:57:49 +0100397 size_t const value = BIT_lookBits(bitD, nbBits);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100398 BIT_skipBits(bitD, nbBits);
399 return value;
400}
401
Yann Collet01e5b952016-03-19 14:14:31 +0100402/*! BIT_readBitsFast() :
Yann Colletb71363b2017-07-19 01:05:40 -0700403 * unsafe version; only works only if nbBits >= 1 */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100404MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, U32 nbBits)
405{
Yann Colletafab0202016-03-23 13:57:49 +0100406 size_t const value = BIT_lookBitsFast(bitD, nbBits);
Yann Collet202082f2017-04-28 16:56:39 -0700407 assert(nbBits >= 1);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100408 BIT_skipBits(bitD, nbBits);
409 return value;
410}
411
Yann Collet01e5b952016-03-19 14:14:31 +0100412/*! BIT_reloadDStream() :
Yann Colletb71363b2017-07-19 01:05:40 -0700413 * Refill `bitD` from buffer previously set in BIT_initDStream() .
414 * This function is safe, it guarantees it will not read beyond src buffer.
415 * @return : status of `BIT_DStream_t` internal register.
Baldur Karlsson430a2fe2018-03-13 20:02:21 +0000416 * when status == BIT_DStream_unfinished, internal register is filled with at least 25 or 57 bits */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100417MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD)
418{
Yann Colletf39a6732017-05-01 09:56:03 -0700419 if (bitD->bitsConsumed > (sizeof(bitD->bitContainer)*8)) /* overflow detected, like end of stream */
Nick Terrell5152fb22017-03-29 18:51:58 -0700420 return BIT_DStream_overflow;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100421
Yann Colletf39a6732017-05-01 09:56:03 -0700422 if (bitD->ptr >= bitD->limitPtr) {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100423 bitD->ptr -= bitD->bitsConsumed >> 3;
424 bitD->bitsConsumed &= 7;
425 bitD->bitContainer = MEM_readLEST(bitD->ptr);
426 return BIT_DStream_unfinished;
427 }
Yann Colletae7aa062016-02-03 02:46:46 +0100428 if (bitD->ptr == bitD->start) {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100429 if (bitD->bitsConsumed < sizeof(bitD->bitContainer)*8) return BIT_DStream_endOfBuffer;
430 return BIT_DStream_completed;
431 }
Yann Colletf39a6732017-05-01 09:56:03 -0700432 /* start < ptr < limitPtr */
Yann Collet01e5b952016-03-19 14:14:31 +0100433 { U32 nbBytes = bitD->bitsConsumed >> 3;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100434 BIT_DStream_status result = BIT_DStream_unfinished;
Yann Colletae7aa062016-02-03 02:46:46 +0100435 if (bitD->ptr - nbBytes < bitD->start) {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100436 nbBytes = (U32)(bitD->ptr - bitD->start); /* ptr > start */
437 result = BIT_DStream_endOfBuffer;
438 }
439 bitD->ptr -= nbBytes;
440 bitD->bitsConsumed -= nbBytes*8;
Yann Colletf39a6732017-05-01 09:56:03 -0700441 bitD->bitContainer = MEM_readLEST(bitD->ptr); /* reminder : srcSize > sizeof(bitD->bitContainer), otherwise bitD->ptr == bitD->start */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100442 return result;
443 }
444}
445
Yann Colletd1d210f2016-03-19 12:12:07 +0100446/*! BIT_endOfDStream() :
Yann Colletb71363b2017-07-19 01:05:40 -0700447 * @return : 1 if DStream has _exactly_ reached its end (all bits consumed).
448 */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100449MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* DStream)
450{
451 return ((DStream->ptr == DStream->start) && (DStream->bitsConsumed == sizeof(DStream->bitContainer)*8));
452}
453
454#if defined (__cplusplus)
455}
456#endif
457
458#endif /* BITSTREAM_H_MODULE */