blob: 37b99c01eed397fc2c9a28cfba5f683679628c4b [file] [log] [blame]
/* ******************************************************************
 * bitstream
 * Part of FSE library
 * Copyright (c) 2013-2020, Yann Collet, Facebook, Inc.
 *
 * You can contact the author at :
 * - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
 *
 * This source code is licensed under both the BSD-style license (found in the
 * LICENSE file in the root directory of this source tree) and the GPLv2 (found
 * in the COPYING file in the root directory of this source tree).
 * You may select, at your option, one of the above-listed licenses.
****************************************************************** */
14#ifndef BITSTREAM_H_MODULE
15#define BITSTREAM_H_MODULE
16
17#if defined (__cplusplus)
18extern "C" {
19#endif
20
/*
*  This API consists of small unitary functions, which must be inlined for best performance.
*  Since link-time-optimization is not available for all compilers,
*  these functions are defined in a .h to be included.
*/
26
Yann Colletae7aa062016-02-03 02:46:46 +010027/*-****************************************
28* Dependencies
Yann Colletb1f3f4b2015-10-18 22:18:32 +010029******************************************/
Yann Collet977f1f32016-01-21 15:38:47 +010030#include "mem.h" /* unaligned access routines */
Nick Terrell718f00f2019-11-25 18:26:19 -080031#include "compiler.h" /* UNLIKELY() */
Yann Colletfa41bcc2018-06-13 14:59:26 -040032#include "debug.h" /* assert(), DEBUGLOG(), RAWLOG() */
Yann Collet977f1f32016-01-21 15:38:47 +010033#include "error_private.h" /* error codes and messages */
Yann Colletb1f3f4b2015-10-18 22:18:32 +010034
35
Yann Collet74bd1192016-03-26 17:50:26 +010036/*=========================================
37* Target specific
38=========================================*/
39#if defined(__BMI__) && defined(__GNUC__)
40# include <immintrin.h> /* support for bextr (experimental) */
Joseph Chen3855bc42019-07-29 15:20:37 +080041#elif defined(__ICCARM__)
42# include <intrinsics.h>
Yann Collet74bd1192016-03-26 17:50:26 +010043#endif
44
/* Accumulator thresholds for 32-bit and 64-bit registers;
 * STREAM_ACCUMULATOR_MIN selects the one matching MEM_32bits(). */
#define STREAM_ACCUMULATOR_MIN_32  25
#define STREAM_ACCUMULATOR_MIN_64  57
#define STREAM_ACCUMULATOR_MIN    ((U32)(MEM_32bits() ? STREAM_ACCUMULATOR_MIN_32 : STREAM_ACCUMULATOR_MIN_64))
Yann Collet74bd1192016-03-26 17:50:26 +010048
Yann Collet8c910d22017-06-03 01:15:02 -070049
Yann Colletae7aa062016-02-03 02:46:46 +010050/*-******************************************
51* bitStream encoding API (write forward)
Yann Colletb1f3f4b2015-10-18 22:18:32 +010052********************************************/
/* bitStream can mix input from multiple sources.
 * A critical property of these streams is that they encode and decode in **reverse** direction.
 * So the first bit sequence you add will be the last to be read, like a LIFO stack.
 */
/* Encoder state : bits accumulate into `bitContainer`,
 * then get written into the destination buffer by the flush functions. */
typedef struct {
    size_t   bitContainer;   /* local register accumulating bits not yet flushed */
    unsigned bitPos;         /* nb of bits currently stored in bitContainer */
    char*    startPtr;       /* beginning of destination buffer */
    char*    ptr;            /* current write position */
    char*    endPtr;         /* set by BIT_initCStream() to startPtr + dstCapacity - sizeof(bitContainer) */
} BIT_CStream_t;
64
Yann Colletae7aa062016-02-03 02:46:46 +010065MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC, void* dstBuffer, size_t dstCapacity);
Yann Colletb1f3f4b2015-10-18 22:18:32 +010066MEM_STATIC void BIT_addBits(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
67MEM_STATIC void BIT_flushBits(BIT_CStream_t* bitC);
68MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC);
69
/* Start with initCStream, providing the size of buffer to write into.
*  bitStream will never write outside of this buffer.
*  `dstCapacity` must be > sizeof(bitC->bitContainer), otherwise @return will be an error code.
*
*  Bits are first added to a local register.
*  Local register is size_t, hence 64-bits on 64-bits systems, or 32-bits on 32-bits systems.
*  Writing data into memory is an explicit operation, performed by the flushBits function.
*  Hence keep track of how many bits are potentially stored into local register to avoid register overflow.
*  After a flushBits, a maximum of 7 bits might still be stored into local register.
*
*  Avoid storing elements of more than 24 bits if you want compatibility with 32-bits bitstream readers.
*
*  Last operation is to close the bitStream.
*  The function returns the final size of CStream in bytes.
*  If data couldn't fit into `dstBuffer`, it will return a 0 ( == not storable)
*/
86
87
Yann Colletae7aa062016-02-03 02:46:46 +010088/*-********************************************
89* bitStream decoding API (read backward)
Yann Colletb1f3f4b2015-10-18 22:18:32 +010090**********************************************/
/* Decoder state : `bitContainer` caches a chunk of the source buffer,
 * `bitsConsumed` counts how many of its bits have already been read. */
typedef struct {
    size_t      bitContainer;   /* local register holding the chunk currently being decoded */
    unsigned    bitsConsumed;   /* nb of bits already consumed from bitContainer */
    const char* ptr;            /* position in source buffer from which bitContainer was loaded */
    const char* start;          /* beginning of source buffer */
    const char* limitPtr;       /* set by BIT_initDStream() to start + sizeof(bitContainer) */
} BIT_DStream_t;
98
/* result of BIT_reloadDStream() */
typedef enum {
    BIT_DStream_unfinished  = 0,
    BIT_DStream_endOfBuffer = 1,
    BIT_DStream_completed   = 2,
    BIT_DStream_overflow    = 3
} BIT_DStream_status;
/* 1,2,4,8 would be better for bitmap combinations, but slows down performance a bit ... :( */
104
105MEM_STATIC size_t BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize);
106MEM_STATIC size_t BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits);
107MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD);
108MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* bitD);
109
110
/* Start by invoking BIT_initDStream().
*  A chunk of the bitStream is then stored into a local register.
*  Local register size is 64-bits on 64-bits systems, 32-bits on 32-bits systems (size_t).
*  You can then retrieve bitFields stored into the local register, **in reverse order**.
*  Local register is explicitly reloaded from memory by the BIT_reloadDStream() method.
*  A reload guarantees a minimum of ((8*sizeof(bitD->bitContainer))-7) bits when its result is BIT_DStream_unfinished.
*  Otherwise, it can be less than that, so proceed accordingly.
*  Checking if DStream has reached its end can be performed with BIT_endOfDStream().
*/
120
121
Yann Colletae7aa062016-02-03 02:46:46 +0100122/*-****************************************
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100123* unsafe API
124******************************************/
125MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
126/* faster, but works only if value is "clean", meaning all high bits above nbBits are 0 */
127
128MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC);
129/* unsafe version; does not check buffer overflow */
130
131MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits);
132/* faster, but works only if nbBits >= 1 */
133
134
135
Yann Colletae7aa062016-02-03 02:46:46 +0100136/*-**************************************************************
Yann Collet6cf45da2016-03-23 14:18:37 +0100137* Internal functions
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100138****************************************************************/
Yann Colletc173dbd2017-12-04 17:57:42 -0800139MEM_STATIC unsigned BIT_highbit32 (U32 val)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100140{
Stella Laue50ed1f2017-08-22 11:55:42 -0700141 assert(val != 0);
142 {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100143# if defined(_MSC_VER) /* Visual */
Stella Laue50ed1f2017-08-22 11:55:42 -0700144 unsigned long r=0;
Bimba Shresthadba3abc2020-03-05 12:20:59 -0800145 return _BitScanReverse ( &r, val ) ? (unsigned)r : 0;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100146# elif defined(__GNUC__) && (__GNUC__ >= 3) /* Use GCC Intrinsic */
Dávid Bolvanský1f7228c2019-09-23 21:23:09 +0200147 return __builtin_clz (val) ^ 31;
Joseph Chen3855bc42019-07-29 15:20:37 +0800148# elif defined(__ICCARM__) /* IAR Intrinsic */
149 return 31 - __CLZ(val);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100150# else /* Software version */
Stella Laue50ed1f2017-08-22 11:55:42 -0700151 static const unsigned DeBruijnClz[32] = { 0, 9, 1, 10, 13, 21, 2, 29,
152 11, 14, 16, 18, 22, 25, 3, 30,
153 8, 12, 20, 28, 15, 17, 24, 7,
154 19, 27, 23, 6, 26, 5, 4, 31 };
155 U32 v = val;
156 v |= v >> 1;
157 v |= v >> 2;
158 v |= v >> 4;
159 v |= v >> 8;
160 v |= v >> 16;
161 return DeBruijnClz[ (U32) (v * 0x07C4ACDDU) >> 27];
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100162# endif
Stella Laue50ed1f2017-08-22 11:55:42 -0700163 }
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100164}
165
/*===== Local Constants =====*/
/* BIT_mask[n] selects the n lowest bits, for n in [0, 31] */
static const unsigned BIT_mask[] = {
    0x0,        0x1,        0x3,        0x7,        0xF,        0x1F,       0x3F,       0x7F,
    0xFF,       0x1FF,      0x3FF,      0x7FF,      0xFFF,      0x1FFF,     0x3FFF,     0x7FFF,
    0xFFFF,     0x1FFFF,    0x3FFFF,    0x7FFFF,    0xFFFFF,    0x1FFFFF,   0x3FFFFF,   0x7FFFFF,
    0xFFFFFF,   0x1FFFFFF,  0x3FFFFFF,  0x7FFFFFF,  0xFFFFFFF,  0x1FFFFFFF, 0x3FFFFFFF, 0x7FFFFFFF
};   /* up to 31 bits */
#define BIT_MASK_SIZE (sizeof(BIT_mask) / sizeof(BIT_mask[0]))
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100175
Yann Colletae7aa062016-02-03 02:46:46 +0100176/*-**************************************************************
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100177* bitStream encoding
178****************************************************************/
Yann Collet01e5b952016-03-19 14:14:31 +0100179/*! BIT_initCStream() :
Yann Colletf39a6732017-05-01 09:56:03 -0700180 * `dstCapacity` must be > sizeof(size_t)
Yann Collet01e5b952016-03-19 14:14:31 +0100181 * @return : 0 if success,
Yann Colletb71363b2017-07-19 01:05:40 -0700182 * otherwise an error code (can be tested using ERR_isError()) */
Yann Colletf39a6732017-05-01 09:56:03 -0700183MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC,
Yann Collet33c38b02017-05-01 11:12:30 -0700184 void* startPtr, size_t dstCapacity)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100185{
186 bitC->bitContainer = 0;
187 bitC->bitPos = 0;
188 bitC->startPtr = (char*)startPtr;
189 bitC->ptr = bitC->startPtr;
Yann Colletf39a6732017-05-01 09:56:03 -0700190 bitC->endPtr = bitC->startPtr + dstCapacity - sizeof(bitC->bitContainer);
191 if (dstCapacity <= sizeof(bitC->bitContainer)) return ERROR(dstSize_tooSmall);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100192 return 0;
193}
194
Yann Collet01e5b952016-03-19 14:14:31 +0100195/*! BIT_addBits() :
Nick Terrell74718d72017-09-15 17:44:09 -0700196 * can add up to 31 bits into `bitC`.
Yann Colletb71363b2017-07-19 01:05:40 -0700197 * Note : does not check for register overflow ! */
Yann Colletf39a6732017-05-01 09:56:03 -0700198MEM_STATIC void BIT_addBits(BIT_CStream_t* bitC,
Yann Collet33c38b02017-05-01 11:12:30 -0700199 size_t value, unsigned nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100200{
Nick Terrell74718d72017-09-15 17:44:09 -0700201 MEM_STATIC_ASSERT(BIT_MASK_SIZE == 32);
202 assert(nbBits < BIT_MASK_SIZE);
203 assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Yann Collet6cf45da2016-03-23 14:18:37 +0100204 bitC->bitContainer |= (value & BIT_mask[nbBits]) << bitC->bitPos;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100205 bitC->bitPos += nbBits;
206}
207
Yann Colletd1d210f2016-03-19 12:12:07 +0100208/*! BIT_addBitsFast() :
Yann Colletfa41bcc2018-06-13 14:59:26 -0400209 * works only if `value` is _clean_,
210 * meaning all high bits above nbBits are 0 */
Yann Colletf39a6732017-05-01 09:56:03 -0700211MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC,
Yann Collet33c38b02017-05-01 11:12:30 -0700212 size_t value, unsigned nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100213{
Yann Collet202082f2017-04-28 16:56:39 -0700214 assert((value>>nbBits) == 0);
Nick Terrell74718d72017-09-15 17:44:09 -0700215 assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100216 bitC->bitContainer |= value << bitC->bitPos;
217 bitC->bitPos += nbBits;
218}
219
Yann Colletd1d210f2016-03-19 12:12:07 +0100220/*! BIT_flushBitsFast() :
Yann Colletf39a6732017-05-01 09:56:03 -0700221 * assumption : bitContainer has not overflowed
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100222 * unsafe version; does not check buffer overflow */
223MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC)
224{
Yann Colletd64f4352016-03-21 00:07:42 +0100225 size_t const nbBytes = bitC->bitPos >> 3;
Nick Terrell74718d72017-09-15 17:44:09 -0700226 assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Bimba Shrestha43da5bf2019-09-12 14:43:50 -0700227 assert(bitC->ptr <= bitC->endPtr);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100228 MEM_writeLEST(bitC->ptr, bitC->bitContainer);
229 bitC->ptr += nbBytes;
230 bitC->bitPos &= 7;
Yann Colletf39a6732017-05-01 09:56:03 -0700231 bitC->bitContainer >>= nbBytes*8;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100232}
233
Yann Collet01e5b952016-03-19 14:14:31 +0100234/*! BIT_flushBits() :
Yann Colletf39a6732017-05-01 09:56:03 -0700235 * assumption : bitContainer has not overflowed
Yann Collet01e5b952016-03-19 14:14:31 +0100236 * safe version; check for buffer overflow, and prevents it.
Yann Collet33c38b02017-05-01 11:12:30 -0700237 * note : does not signal buffer overflow.
238 * overflow will be revealed later on using BIT_closeCStream() */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100239MEM_STATIC void BIT_flushBits(BIT_CStream_t* bitC)
240{
Yann Colletd64f4352016-03-21 00:07:42 +0100241 size_t const nbBytes = bitC->bitPos >> 3;
Nick Terrell74718d72017-09-15 17:44:09 -0700242 assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
Bimba Shresthafe9af332019-09-12 15:35:27 -0700243 assert(bitC->ptr <= bitC->endPtr);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100244 MEM_writeLEST(bitC->ptr, bitC->bitContainer);
245 bitC->ptr += nbBytes;
246 if (bitC->ptr > bitC->endPtr) bitC->ptr = bitC->endPtr;
247 bitC->bitPos &= 7;
Yann Collet33c38b02017-05-01 11:12:30 -0700248 bitC->bitContainer >>= nbBytes*8;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100249}
250
Yann Colletd1d210f2016-03-19 12:12:07 +0100251/*! BIT_closeCStream() :
Yann Collet01e5b952016-03-19 14:14:31 +0100252 * @return : size of CStream, in bytes,
Yann Colletb71363b2017-07-19 01:05:40 -0700253 * or 0 if it could not fit into dstBuffer */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100254MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC)
255{
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100256 BIT_addBitsFast(bitC, 1, 1); /* endMark */
257 BIT_flushBits(bitC);
Yann Collet33c38b02017-05-01 11:12:30 -0700258 if (bitC->ptr >= bitC->endPtr) return 0; /* overflow detected */
Yann Collet01e5b952016-03-19 14:14:31 +0100259 return (bitC->ptr - bitC->startPtr) + (bitC->bitPos > 0);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100260}
261
262
Yann Colletae7aa062016-02-03 02:46:46 +0100263/*-********************************************************
Yann Colletb71363b2017-07-19 01:05:40 -0700264* bitStream decoding
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100265**********************************************************/
Yann Collet01e5b952016-03-19 14:14:31 +0100266/*! BIT_initDStream() :
Yann Colletb71363b2017-07-19 01:05:40 -0700267 * Initialize a BIT_DStream_t.
268 * `bitD` : a pointer to an already allocated BIT_DStream_t structure.
269 * `srcSize` must be the *exact* size of the bitStream, in bytes.
270 * @return : size of stream (== srcSize), or an errorCode if a problem is detected
271 */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100272MEM_STATIC size_t BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize)
273{
274 if (srcSize < 1) { memset(bitD, 0, sizeof(*bitD)); return ERROR(srcSize_wrong); }
275
Yann Colletf39a6732017-05-01 09:56:03 -0700276 bitD->start = (const char*)srcBuffer;
277 bitD->limitPtr = bitD->start + sizeof(bitD->bitContainer);
278
Yann Collet1032fbe2016-05-11 18:30:24 +0200279 if (srcSize >= sizeof(bitD->bitContainer)) { /* normal case */
Yann Collet1032fbe2016-05-11 18:30:24 +0200280 bitD->ptr = (const char*)srcBuffer + srcSize - sizeof(bitD->bitContainer);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100281 bitD->bitContainer = MEM_readLEST(bitD->ptr);
Yann Colletb21ce152016-03-24 01:27:55 +0100282 { BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
Yann Collet5397a662016-12-13 15:21:06 +0100283 bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0; /* ensures bitsConsumed is always set */
Yann Collet18c8f792016-06-12 22:51:52 +0200284 if (lastByte == 0) return ERROR(GENERIC); /* endMark not present */ }
Yann Colletae7aa062016-02-03 02:46:46 +0100285 } else {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100286 bitD->ptr = bitD->start;
Yann Collet1ceb5a92016-05-12 13:50:13 +0200287 bitD->bitContainer = *(const BYTE*)(bitD->start);
288 switch(srcSize)
289 {
Yann Colletb71363b2017-07-19 01:05:40 -0700290 case 7: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[6]) << (sizeof(bitD->bitContainer)*8 - 16);
291 /* fall-through */
Jos Collin05286fd2017-05-09 08:36:05 +0530292
Yann Colletb71363b2017-07-19 01:05:40 -0700293 case 6: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[5]) << (sizeof(bitD->bitContainer)*8 - 24);
294 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700295
Yann Colletb71363b2017-07-19 01:05:40 -0700296 case 5: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[4]) << (sizeof(bitD->bitContainer)*8 - 32);
297 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700298
Yann Colletb71363b2017-07-19 01:05:40 -0700299 case 4: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[3]) << 24;
300 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700301
Yann Colletb71363b2017-07-19 01:05:40 -0700302 case 3: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[2]) << 16;
303 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700304
Yann Colletb71363b2017-07-19 01:05:40 -0700305 case 2: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[1]) << 8;
306 /* fall-through */
Yann Collet58e8d792017-06-02 18:20:48 -0700307
Yann Colletb71363b2017-07-19 01:05:40 -0700308 default: break;
Yann Collet1ceb5a92016-05-12 13:50:13 +0200309 }
Yann Colletb71363b2017-07-19 01:05:40 -0700310 { BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
311 bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0;
312 if (lastByte == 0) return ERROR(corruption_detected); /* endMark not present */
313 }
Yann Collet1032fbe2016-05-11 18:30:24 +0200314 bitD->bitsConsumed += (U32)(sizeof(bitD->bitContainer) - srcSize)*8;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100315 }
316
317 return srcSize;
318}
319
Yann Collet1032fbe2016-05-11 18:30:24 +0200320MEM_STATIC size_t BIT_getUpperBits(size_t bitContainer, U32 const start)
Yann Collet3c017862016-03-23 14:09:51 +0100321{
Yann Collet1032fbe2016-05-11 18:30:24 +0200322 return bitContainer >> start;
Yann Collet3c017862016-03-23 14:09:51 +0100323}
324
Yann Collet1032fbe2016-05-11 18:30:24 +0200325MEM_STATIC size_t BIT_getMiddleBits(size_t bitContainer, U32 const start, U32 const nbBits)
Yann Collet3c017862016-03-23 14:09:51 +0100326{
Yann Collet6ed3b522018-10-10 18:26:44 -0700327 U32 const regMask = sizeof(bitContainer)*8 - 1;
328 /* if start > regMask, bitstream is corrupted, and result is undefined */
Nick Terrell74718d72017-09-15 17:44:09 -0700329 assert(nbBits < BIT_MASK_SIZE);
Yann Collet6ed3b522018-10-10 18:26:44 -0700330 return (bitContainer >> (start & regMask)) & BIT_mask[nbBits];
Yann Collet3c017862016-03-23 14:09:51 +0100331}
332
Yann Collet1032fbe2016-05-11 18:30:24 +0200333MEM_STATIC size_t BIT_getLowerBits(size_t bitContainer, U32 const nbBits)
Yann Colletafab0202016-03-23 13:57:49 +0100334{
Nick Terrell74718d72017-09-15 17:44:09 -0700335 assert(nbBits < BIT_MASK_SIZE);
Yann Collet1032fbe2016-05-11 18:30:24 +0200336 return bitContainer & BIT_mask[nbBits];
Yann Colletafab0202016-03-23 13:57:49 +0100337}
338
Yann Collet01e5b952016-03-19 14:14:31 +0100339/*! BIT_lookBits() :
340 * Provides next n bits from local register.
Yann Collet1032fbe2016-05-11 18:30:24 +0200341 * local register is not modified.
Yann Collet01e5b952016-03-19 14:14:31 +0100342 * On 32-bits, maxNbBits==24.
343 * On 64-bits, maxNbBits==56.
Yann Colletb71363b2017-07-19 01:05:40 -0700344 * @return : value extracted */
345MEM_STATIC size_t BIT_lookBits(const BIT_DStream_t* bitD, U32 nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100346{
Yann Collet7791f192018-10-10 16:36:11 -0700347 /* arbitrate between double-shift and shift+mask */
Yann Colletd3ec2332018-10-10 15:48:43 -0700348#if 1
Yann Collet7791f192018-10-10 16:36:11 -0700349 /* if bitD->bitsConsumed + nbBits > sizeof(bitD->bitContainer)*8,
350 * bitstream is likely corrupted, and result is undefined */
Yann Collet1032fbe2016-05-11 18:30:24 +0200351 return BIT_getMiddleBits(bitD->bitContainer, (sizeof(bitD->bitContainer)*8) - bitD->bitsConsumed - nbBits, nbBits);
Yann Collet862a8592016-03-23 18:45:23 +0100352#else
Yann Collet7791f192018-10-10 16:36:11 -0700353 /* this code path is slower on my os-x laptop */
Yann Colletf39a6732017-05-01 09:56:03 -0700354 U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
355 return ((bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> 1) >> ((regMask-nbBits) & regMask);
Yann Collet862a8592016-03-23 18:45:23 +0100356#endif
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100357}
358
Yann Collet01e5b952016-03-19 14:14:31 +0100359/*! BIT_lookBitsFast() :
Yann Collet202082f2017-04-28 16:56:39 -0700360 * unsafe version; only works if nbBits >= 1 */
Yann Colletadd08d62016-03-23 01:32:41 +0100361MEM_STATIC size_t BIT_lookBitsFast(const BIT_DStream_t* bitD, U32 nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100362{
Yann Colletf39a6732017-05-01 09:56:03 -0700363 U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
Yann Collet202082f2017-04-28 16:56:39 -0700364 assert(nbBits >= 1);
Yann Colletf39a6732017-05-01 09:56:03 -0700365 return (bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> (((regMask+1)-nbBits) & regMask);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100366}
367
368MEM_STATIC void BIT_skipBits(BIT_DStream_t* bitD, U32 nbBits)
369{
370 bitD->bitsConsumed += nbBits;
371}
372
Yann Collet01e5b952016-03-19 14:14:31 +0100373/*! BIT_readBits() :
Yann Colletb21ce152016-03-24 01:27:55 +0100374 * Read (consume) next n bits from local register and update.
375 * Pay attention to not read more than nbBits contained into local register.
Yann Colletb71363b2017-07-19 01:05:40 -0700376 * @return : extracted value. */
Yann Colletededcfc2018-12-21 16:19:44 -0800377MEM_STATIC size_t BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100378{
Yann Colletafab0202016-03-23 13:57:49 +0100379 size_t const value = BIT_lookBits(bitD, nbBits);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100380 BIT_skipBits(bitD, nbBits);
381 return value;
382}
383
Yann Collet01e5b952016-03-19 14:14:31 +0100384/*! BIT_readBitsFast() :
Yann Colletb71363b2017-07-19 01:05:40 -0700385 * unsafe version; only works only if nbBits >= 1 */
Yann Colletededcfc2018-12-21 16:19:44 -0800386MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits)
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100387{
Yann Colletafab0202016-03-23 13:57:49 +0100388 size_t const value = BIT_lookBitsFast(bitD, nbBits);
Yann Collet202082f2017-04-28 16:56:39 -0700389 assert(nbBits >= 1);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100390 BIT_skipBits(bitD, nbBits);
391 return value;
392}
393
Nick Terrell718f00f2019-11-25 18:26:19 -0800394/*! BIT_reloadDStreamFast() :
395 * Similar to BIT_reloadDStream(), but with two differences:
396 * 1. bitsConsumed <= sizeof(bitD->bitContainer)*8 must hold!
397 * 2. Returns BIT_DStream_overflow when bitD->ptr < bitD->limitPtr, at this
398 * point you must use BIT_reloadDStream() to reload.
399 */
400MEM_STATIC BIT_DStream_status BIT_reloadDStreamFast(BIT_DStream_t* bitD)
401{
402 if (UNLIKELY(bitD->ptr < bitD->limitPtr))
403 return BIT_DStream_overflow;
404 assert(bitD->bitsConsumed <= sizeof(bitD->bitContainer)*8);
405 bitD->ptr -= bitD->bitsConsumed >> 3;
406 bitD->bitsConsumed &= 7;
407 bitD->bitContainer = MEM_readLEST(bitD->ptr);
408 return BIT_DStream_unfinished;
409}
410
Yann Collet01e5b952016-03-19 14:14:31 +0100411/*! BIT_reloadDStream() :
Yann Colletb71363b2017-07-19 01:05:40 -0700412 * Refill `bitD` from buffer previously set in BIT_initDStream() .
413 * This function is safe, it guarantees it will not read beyond src buffer.
414 * @return : status of `BIT_DStream_t` internal register.
Baldur Karlsson430a2fe2018-03-13 20:02:21 +0000415 * when status == BIT_DStream_unfinished, internal register is filled with at least 25 or 57 bits */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100416MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD)
417{
Yann Colletf39a6732017-05-01 09:56:03 -0700418 if (bitD->bitsConsumed > (sizeof(bitD->bitContainer)*8)) /* overflow detected, like end of stream */
Nick Terrell5152fb22017-03-29 18:51:58 -0700419 return BIT_DStream_overflow;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100420
Yann Colletf39a6732017-05-01 09:56:03 -0700421 if (bitD->ptr >= bitD->limitPtr) {
Nick Terrell718f00f2019-11-25 18:26:19 -0800422 return BIT_reloadDStreamFast(bitD);
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100423 }
Yann Colletae7aa062016-02-03 02:46:46 +0100424 if (bitD->ptr == bitD->start) {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100425 if (bitD->bitsConsumed < sizeof(bitD->bitContainer)*8) return BIT_DStream_endOfBuffer;
426 return BIT_DStream_completed;
427 }
Yann Colletf39a6732017-05-01 09:56:03 -0700428 /* start < ptr < limitPtr */
Yann Collet01e5b952016-03-19 14:14:31 +0100429 { U32 nbBytes = bitD->bitsConsumed >> 3;
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100430 BIT_DStream_status result = BIT_DStream_unfinished;
Yann Colletae7aa062016-02-03 02:46:46 +0100431 if (bitD->ptr - nbBytes < bitD->start) {
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100432 nbBytes = (U32)(bitD->ptr - bitD->start); /* ptr > start */
433 result = BIT_DStream_endOfBuffer;
434 }
435 bitD->ptr -= nbBytes;
436 bitD->bitsConsumed -= nbBytes*8;
Yann Colletf39a6732017-05-01 09:56:03 -0700437 bitD->bitContainer = MEM_readLEST(bitD->ptr); /* reminder : srcSize > sizeof(bitD->bitContainer), otherwise bitD->ptr == bitD->start */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100438 return result;
439 }
440}
441
Yann Colletd1d210f2016-03-19 12:12:07 +0100442/*! BIT_endOfDStream() :
Yann Colletb71363b2017-07-19 01:05:40 -0700443 * @return : 1 if DStream has _exactly_ reached its end (all bits consumed).
444 */
Yann Colletb1f3f4b2015-10-18 22:18:32 +0100445MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* DStream)
446{
447 return ((DStream->ptr == DStream->start) && (DStream->bitsConsumed == sizeof(DStream->bitContainer)*8));
448}
449
450#if defined (__cplusplus)
451}
452#endif
453
454#endif /* BITSTREAM_H_MODULE */