blob: f786c105473519cb79c5937a8570d253371b003a [file] [log] [blame]
/*
 * jdhuff.c
 *
 * This file was part of the Independent JPEG Group's software:
 * Copyright (C) 1991-1997, Thomas G. Lane.
 * libjpeg-turbo Modifications:
 * Copyright (C) 2009-2011, 2016, 2018-2019, D. R. Commander.
 * Copyright (C) 2018, Matthias Räncker.
 * For conditions of distribution and use, see the accompanying README.ijg
 * file.
 *
 * This file contains Huffman entropy decoding routines.
 *
 * Much of the complexity here has to do with supporting input suspension.
 * If the data source module demands suspension, we want to be able to back
 * up to the start of the current MCU.  To do this, we copy state variables
 * into local working storage, and update them back to the permanent
 * storage only upon successful completion of an MCU.
 *
 * NOTE: All referenced figures are from
 * Recommendation ITU-T T.81 (1992) | ISO/IEC 10918-1:1994.
 */
23
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000024#define JPEG_INTERNALS
25#include "jinclude.h"
26#include "jpeglib.h"
Tom Hudson0d47d2d2016-05-04 13:22:56 -040027#include "jdhuff.h" /* Declarations shared with jdphuff.c */
hbono@chromium.org98626972011-08-03 03:13:08 +000028#include "jpegcomp.h"
Tom Hudson0d47d2d2016-05-04 13:22:56 -040029#include "jstdhuff.c"
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000030
31
32/*
33 * Expanded entropy decoder object for Huffman decoding.
34 *
35 * The savable_state subrecord contains fields that change within an MCU,
36 * but must not be updated permanently until we complete the MCU.
37 */
38
39typedef struct {
40 int last_dc_val[MAX_COMPS_IN_SCAN]; /* last DC coef for each component */
41} savable_state;
42
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000043typedef struct {
44 struct jpeg_entropy_decoder pub; /* public fields */
45
46 /* These fields are loaded into local variables at start of each MCU.
47 * In case of suspension, we exit WITHOUT updating them.
48 */
Tom Hudson0d47d2d2016-05-04 13:22:56 -040049 bitread_perm_state bitstate; /* Bit buffer at start of MCU */
50 savable_state saved; /* Other state at start of MCU */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000051
52 /* These fields are NOT loaded into local working state. */
Tom Hudson0d47d2d2016-05-04 13:22:56 -040053 unsigned int restarts_to_go; /* MCUs left in this restart interval */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000054
55 /* Pointers to derived tables (these workspaces have image lifespan) */
Tom Hudson0d47d2d2016-05-04 13:22:56 -040056 d_derived_tbl *dc_derived_tbls[NUM_HUFF_TBLS];
57 d_derived_tbl *ac_derived_tbls[NUM_HUFF_TBLS];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000058
59 /* Precalculated info set up by start_pass for use in decode_mcu: */
60
61 /* Pointers to derived tables to be used for each block within an MCU */
Tom Hudson0d47d2d2016-05-04 13:22:56 -040062 d_derived_tbl *dc_cur_tbls[D_MAX_BLOCKS_IN_MCU];
63 d_derived_tbl *ac_cur_tbls[D_MAX_BLOCKS_IN_MCU];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000064 /* Whether we care about the DC and AC coefficient values for each block */
65 boolean dc_needed[D_MAX_BLOCKS_IN_MCU];
66 boolean ac_needed[D_MAX_BLOCKS_IN_MCU];
67} huff_entropy_decoder;
68
Tom Hudson0d47d2d2016-05-04 13:22:56 -040069typedef huff_entropy_decoder *huff_entropy_ptr;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000070
71
72/*
73 * Initialize for a Huffman-compressed scan.
74 */
75
76METHODDEF(void)
Chris Blumecca8c4d2019-03-01 01:09:50 -080077start_pass_huff_decoder(j_decompress_ptr cinfo)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000078{
Chris Blumecca8c4d2019-03-01 01:09:50 -080079 huff_entropy_ptr entropy = (huff_entropy_ptr)cinfo->entropy;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000080 int ci, blkn, dctbl, actbl;
Tom Hudson0d47d2d2016-05-04 13:22:56 -040081 d_derived_tbl **pdtbl;
82 jpeg_component_info *compptr;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000083
84 /* Check that the scan parameters Ss, Se, Ah/Al are OK for sequential JPEG.
85 * This ought to be an error condition, but we make it a warning because
86 * there are some baseline files out there with all zeroes in these bytes.
87 */
Chris Blumecca8c4d2019-03-01 01:09:50 -080088 if (cinfo->Ss != 0 || cinfo->Se != DCTSIZE2 - 1 ||
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +000089 cinfo->Ah != 0 || cinfo->Al != 0)
90 WARNMS(cinfo, JWRN_NOT_SEQUENTIAL);
91
92 for (ci = 0; ci < cinfo->comps_in_scan; ci++) {
93 compptr = cinfo->cur_comp_info[ci];
94 dctbl = compptr->dc_tbl_no;
95 actbl = compptr->ac_tbl_no;
96 /* Compute derived values for Huffman tables */
97 /* We may do this more than once for a table, but it's not expensive */
Chris Blumecca8c4d2019-03-01 01:09:50 -080098 pdtbl = (d_derived_tbl **)(entropy->dc_derived_tbls) + dctbl;
Tom Hudson0d47d2d2016-05-04 13:22:56 -040099 jpeg_make_d_derived_tbl(cinfo, TRUE, dctbl, pdtbl);
Chris Blumecca8c4d2019-03-01 01:09:50 -0800100 pdtbl = (d_derived_tbl **)(entropy->ac_derived_tbls) + actbl;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400101 jpeg_make_d_derived_tbl(cinfo, FALSE, actbl, pdtbl);
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000102 /* Initialize DC predictions to 0 */
103 entropy->saved.last_dc_val[ci] = 0;
104 }
105
106 /* Precalculate decoding info for each block in an MCU of this scan */
107 for (blkn = 0; blkn < cinfo->blocks_in_MCU; blkn++) {
108 ci = cinfo->MCU_membership[blkn];
109 compptr = cinfo->cur_comp_info[ci];
110 /* Precalculate which table to use for each block */
111 entropy->dc_cur_tbls[blkn] = entropy->dc_derived_tbls[compptr->dc_tbl_no];
112 entropy->ac_cur_tbls[blkn] = entropy->ac_derived_tbls[compptr->ac_tbl_no];
113 /* Decide whether we really care about the coefficient values */
114 if (compptr->component_needed) {
115 entropy->dc_needed[blkn] = TRUE;
116 /* we don't need the ACs if producing a 1/8th-size image */
hbono@chromium.org98626972011-08-03 03:13:08 +0000117 entropy->ac_needed[blkn] = (compptr->_DCT_scaled_size > 1);
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000118 } else {
119 entropy->dc_needed[blkn] = entropy->ac_needed[blkn] = FALSE;
120 }
121 }
122
123 /* Initialize bitread state variables */
124 entropy->bitstate.bits_left = 0;
125 entropy->bitstate.get_buffer = 0; /* unnecessary, but keeps Purify quiet */
126 entropy->pub.insufficient_data = FALSE;
127
128 /* Initialize restart counter */
129 entropy->restarts_to_go = cinfo->restart_interval;
130}
131
132
133/*
134 * Compute the derived values for a Huffman table.
135 * This routine also performs some validation checks on the table.
136 *
137 * Note this is also used by jdphuff.c.
138 */
139
140GLOBAL(void)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800141jpeg_make_d_derived_tbl(j_decompress_ptr cinfo, boolean isDC, int tblno,
142 d_derived_tbl **pdtbl)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000143{
144 JHUFF_TBL *htbl;
145 d_derived_tbl *dtbl;
146 int p, i, l, si, numsymbols;
147 int lookbits, ctr;
148 char huffsize[257];
149 unsigned int huffcode[257];
150 unsigned int code;
151
152 /* Note that huffsize[] and huffcode[] are filled in code-length order,
153 * paralleling the order of the symbols themselves in htbl->huffval[].
154 */
155
156 /* Find the input Huffman table */
157 if (tblno < 0 || tblno >= NUM_HUFF_TBLS)
158 ERREXIT1(cinfo, JERR_NO_HUFF_TABLE, tblno);
159 htbl =
160 isDC ? cinfo->dc_huff_tbl_ptrs[tblno] : cinfo->ac_huff_tbl_ptrs[tblno];
161 if (htbl == NULL)
162 ERREXIT1(cinfo, JERR_NO_HUFF_TABLE, tblno);
163
164 /* Allocate a workspace if we haven't already done so. */
165 if (*pdtbl == NULL)
166 *pdtbl = (d_derived_tbl *)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800167 (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400168 sizeof(d_derived_tbl));
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000169 dtbl = *pdtbl;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400170 dtbl->pub = htbl; /* fill in back link */
171
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000172 /* Figure C.1: make table of Huffman code length for each symbol */
173
174 p = 0;
175 for (l = 1; l <= 16; l++) {
Chris Blumecca8c4d2019-03-01 01:09:50 -0800176 i = (int)htbl->bits[l];
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400177 if (i < 0 || p + i > 256) /* protect against table overrun */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000178 ERREXIT(cinfo, JERR_BAD_HUFF_TABLE);
179 while (i--)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800180 huffsize[p++] = (char)l;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000181 }
182 huffsize[p] = 0;
183 numsymbols = p;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400184
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000185 /* Figure C.2: generate the codes themselves */
186 /* We also validate that the counts represent a legal Huffman code tree. */
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400187
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000188 code = 0;
189 si = huffsize[0];
190 p = 0;
191 while (huffsize[p]) {
Chris Blumecca8c4d2019-03-01 01:09:50 -0800192 while (((int)huffsize[p]) == si) {
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000193 huffcode[p++] = code;
194 code++;
195 }
196 /* code is now 1 more than the last code used for codelength si; but
197 * it must still fit in si bits, since no code is allowed to be all ones.
198 */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800199 if (((JLONG)code) >= (((JLONG)1) << si))
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000200 ERREXIT(cinfo, JERR_BAD_HUFF_TABLE);
201 code <<= 1;
202 si++;
203 }
204
205 /* Figure F.15: generate decoding tables for bit-sequential decoding */
206
207 p = 0;
208 for (l = 1; l <= 16; l++) {
209 if (htbl->bits[l]) {
210 /* valoffset[l] = huffval[] index of 1st symbol of code length l,
211 * minus the minimum code of length l
212 */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800213 dtbl->valoffset[l] = (JLONG)p - (JLONG)huffcode[p];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000214 p += htbl->bits[l];
Chris Blumecca8c4d2019-03-01 01:09:50 -0800215 dtbl->maxcode[l] = huffcode[p - 1]; /* maximum code of length l */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000216 } else {
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400217 dtbl->maxcode[l] = -1; /* -1 if no codes of this length */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000218 }
219 }
220 dtbl->valoffset[17] = 0;
221 dtbl->maxcode[17] = 0xFFFFFL; /* ensures jpeg_huff_decode terminates */
222
223 /* Compute lookahead tables to speed up decoding.
224 * First we set all the table entries to 0, indicating "too long";
225 * then we iterate through the Huffman codes that are short enough and
226 * fill in all the entries that correspond to bit sequences starting
227 * with that code.
228 */
229
Chris Blumecca8c4d2019-03-01 01:09:50 -0800230 for (i = 0; i < (1 << HUFF_LOOKAHEAD); i++)
231 dtbl->lookup[i] = (HUFF_LOOKAHEAD + 1) << HUFF_LOOKAHEAD;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000232
233 p = 0;
234 for (l = 1; l <= HUFF_LOOKAHEAD; l++) {
Chris Blumecca8c4d2019-03-01 01:09:50 -0800235 for (i = 1; i <= (int)htbl->bits[l]; i++, p++) {
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000236 /* l = current code's length, p = its index in huffcode[] & huffval[]. */
237 /* Generate left-justified code followed by all possible bit sequences */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800238 lookbits = huffcode[p] << (HUFF_LOOKAHEAD - l);
239 for (ctr = 1 << (HUFF_LOOKAHEAD - l); ctr > 0; ctr--) {
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400240 dtbl->lookup[lookbits] = (l << HUFF_LOOKAHEAD) | htbl->huffval[p];
241 lookbits++;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000242 }
243 }
244 }
245
246 /* Validate symbols as being reasonable.
247 * For AC tables, we make no check, but accept all byte values 0..255.
248 * For DC tables, we require the symbols to be in range 0..15.
249 * (Tighter bounds could be applied depending on the data depth and mode,
250 * but this is sufficient to ensure safe decoding.)
251 */
252 if (isDC) {
253 for (i = 0; i < numsymbols; i++) {
254 int sym = htbl->huffval[i];
255 if (sym < 0 || sym > 15)
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400256 ERREXIT(cinfo, JERR_BAD_HUFF_TABLE);
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000257 }
258 }
259}
260
261
262/*
263 * Out-of-line code for bit fetching (shared with jdphuff.c).
264 * See jdhuff.h for info about usage.
265 * Note: current values of get_buffer and bits_left are passed as parameters,
266 * but are returned in the corresponding fields of the state struct.
267 *
268 * On most machines MIN_GET_BITS should be 25 to allow the full 32-bit width
269 * of get_buffer to be used. (On machines with wider words, an even larger
270 * buffer could be used.) However, on some machines 32-bit shifts are
271 * quite slow and take time proportional to the number of places shifted.
272 * (This is true with most PC compilers, for instance.) In this case it may
273 * be a win to set MIN_GET_BITS to the minimum value of 15. This reduces the
274 * average shift distance at the cost of more calls to jpeg_fill_bit_buffer.
275 */
276
277#ifdef SLOW_SHIFT_32
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400278#define MIN_GET_BITS 15 /* minimum allowable value */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000279#else
Chris Blumecca8c4d2019-03-01 01:09:50 -0800280#define MIN_GET_BITS (BIT_BUF_SIZE - 7)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000281#endif
282
283
284GLOBAL(boolean)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800285jpeg_fill_bit_buffer(bitread_working_state *state,
286 register bit_buf_type get_buffer, register int bits_left,
287 int nbits)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000288/* Load up the bit buffer to a depth of at least nbits */
289{
290 /* Copy heavily used state fields into locals (hopefully registers) */
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400291 register const JOCTET *next_input_byte = state->next_input_byte;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000292 register size_t bytes_in_buffer = state->bytes_in_buffer;
293 j_decompress_ptr cinfo = state->cinfo;
294
295 /* Attempt to load at least MIN_GET_BITS bits into get_buffer. */
296 /* (It is assumed that no request will be for more than that many bits.) */
297 /* We fail to do so only if we hit a marker or are forced to suspend. */
298
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400299 if (cinfo->unread_marker == 0) { /* cannot advance past a marker */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000300 while (bits_left < MIN_GET_BITS) {
301 register int c;
302
303 /* Attempt to read a byte */
304 if (bytes_in_buffer == 0) {
Chris Blumecca8c4d2019-03-01 01:09:50 -0800305 if (!(*cinfo->src->fill_input_buffer) (cinfo))
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400306 return FALSE;
307 next_input_byte = cinfo->src->next_input_byte;
308 bytes_in_buffer = cinfo->src->bytes_in_buffer;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000309 }
310 bytes_in_buffer--;
Jonathan Wrightbbb82822020-11-25 13:36:43 +0000311 c = *next_input_byte++;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000312
313 /* If it's 0xFF, check and discard stuffed zero byte */
314 if (c == 0xFF) {
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400315 /* Loop here to discard any padding FF's on terminating marker,
316 * so that we can save a valid unread_marker value. NOTE: we will
317 * accept multiple FF's followed by a 0 as meaning a single FF data
318 * byte. This data pattern is not valid according to the standard.
319 */
320 do {
321 if (bytes_in_buffer == 0) {
Chris Blumecca8c4d2019-03-01 01:09:50 -0800322 if (!(*cinfo->src->fill_input_buffer) (cinfo))
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400323 return FALSE;
324 next_input_byte = cinfo->src->next_input_byte;
325 bytes_in_buffer = cinfo->src->bytes_in_buffer;
326 }
327 bytes_in_buffer--;
Jonathan Wrightbbb82822020-11-25 13:36:43 +0000328 c = *next_input_byte++;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400329 } while (c == 0xFF);
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000330
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400331 if (c == 0) {
332 /* Found FF/00, which represents an FF data byte */
333 c = 0xFF;
334 } else {
335 /* Oops, it's actually a marker indicating end of compressed data.
336 * Save the marker code for later use.
337 * Fine point: it might appear that we should save the marker into
338 * bitread working state, not straight into permanent state. But
339 * once we have hit a marker, we cannot need to suspend within the
340 * current MCU, because we will read no more bytes from the data
341 * source. So it is OK to update permanent state right away.
342 */
343 cinfo->unread_marker = c;
344 /* See if we need to insert some fake zero bits. */
345 goto no_more_bytes;
346 }
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000347 }
348
349 /* OK, load c into get_buffer */
350 get_buffer = (get_buffer << 8) | c;
351 bits_left += 8;
352 } /* end while */
353 } else {
Chris Blumecca8c4d2019-03-01 01:09:50 -0800354no_more_bytes:
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000355 /* We get here if we've read the marker that terminates the compressed
356 * data segment. There should be enough bits in the buffer register
357 * to satisfy the request; if so, no problem.
358 */
359 if (nbits > bits_left) {
360 /* Uh-oh. Report corrupted data to user and stuff zeroes into
361 * the data stream, so that we can produce some kind of image.
362 * We use a nonvolatile flag to ensure that only one warning message
363 * appears per data segment.
364 */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800365 if (!cinfo->entropy->insufficient_data) {
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400366 WARNMS(cinfo, JWRN_HIT_MARKER);
367 cinfo->entropy->insufficient_data = TRUE;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000368 }
369 /* Fill the buffer with zero bits */
370 get_buffer <<= MIN_GET_BITS - bits_left;
371 bits_left = MIN_GET_BITS;
372 }
373 }
374
375 /* Unload the local registers */
376 state->next_input_byte = next_input_byte;
377 state->bytes_in_buffer = bytes_in_buffer;
378 state->get_buffer = get_buffer;
379 state->bits_left = bits_left;
380
381 return TRUE;
382}
383
384
/* Macro version of the above, which performs much better but does not
 * handle markers.  Blocks containing markers have to be handed off to the
 * slower routines.
 *
 * GET_BYTE expects `buffer`, `get_buffer`, `bits_left` and `cinfo` to be in
 * scope where it is expanded.  It always reads the byte after the one it
 * consumes, so at least two readable bytes must be available at `buffer`.
 */

#define GET_BYTE { \
  register int byte_now, byte_next; \
  byte_now = *buffer++; \
  byte_next = *buffer; \
  /* Pre-execute most common case */ \
  get_buffer = (get_buffer << 8) | byte_now; \
  bits_left += 8; \
  if (byte_now == 0xFF) { \
    if (byte_next == 0) { \
      /* FF/00 represents an FF data byte: skip the stuffed zero */ \
      buffer++; \
    } else { \
      /* Oops, it's actually a marker indicating end of compressed data. */ \
      cinfo->unread_marker = byte_next; \
      /* Step back onto the FF and turn the loaded byte into zero bits */ \
      buffer--; \
      get_buffer &= ~0xFF; \
    } \
  } \
}

#if SIZEOF_SIZE_T == 8 || defined(_WIN64) || (defined(__x86_64__) && defined(__ILP32__))

/* Pre-fetch 48 bits (6 bytes), because the holding register is 64-bit */
#define FILL_BIT_BUFFER_FAST \
  if (bits_left <= 16) { \
    GET_BYTE GET_BYTE GET_BYTE GET_BYTE GET_BYTE GET_BYTE \
  }

#else

/* Pre-fetch 16 bits (2 bytes), because the holding register is 32-bit */
#define FILL_BIT_BUFFER_FAST \
  if (bits_left <= 16) { \
    GET_BYTE GET_BYTE \
  }

#endif
426
427
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000428/*
429 * Out-of-line code for Huffman code decoding.
430 * See jdhuff.h for info about usage.
431 */
432
433GLOBAL(int)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800434jpeg_huff_decode(bitread_working_state *state,
435 register bit_buf_type get_buffer, register int bits_left,
436 d_derived_tbl *htbl, int min_bits)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000437{
438 register int l = min_bits;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400439 register JLONG code;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000440
441 /* HUFF_DECODE has determined that the code is at least min_bits */
442 /* bits long, so fetch that many bits in one swoop. */
443
444 CHECK_BIT_BUFFER(*state, l, return -1);
445 code = GET_BITS(l);
446
447 /* Collect the rest of the Huffman code one bit at a time. */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800448 /* This is per Figure F.16. */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000449
450 while (code > htbl->maxcode[l]) {
451 code <<= 1;
452 CHECK_BIT_BUFFER(*state, 1, return -1);
453 code |= GET_BITS(1);
454 l++;
455 }
456
457 /* Unload the local registers */
458 state->get_buffer = get_buffer;
459 state->bits_left = bits_left;
460
461 /* With garbage input we may reach the sentinel value l = 17. */
462
463 if (l > 16) {
464 WARNMS(state->cinfo, JWRN_HUFF_BAD_CODE);
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400465 return 0; /* fake a zero as the safest result */
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000466 }
467
Chris Blumecca8c4d2019-03-01 01:09:50 -0800468 return htbl->pub->huffval[(int)(code + htbl->valoffset[l])];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000469}
470
471
/*
 * Figure F.12: extend sign bit.
 * On some machines, a shift and add will be faster than a table lookup.
 *
 * HUFF_EXTEND(x, s) maps the s-bit magnitude x to its signed value: x is
 * returned unchanged when x >= 2**(s-1), otherwise x - 2**s + 1 is returned.
 *
 * The shift-and-add form relies on int being 32 bits wide and on >> of a
 * negative int being an arithmetic shift, so that the comparison result is
 * smeared into an all-ones or all-zeroes mask.  The left shift is done on an
 * unsigned all-ones value (NEG_1) because left-shifting a negative signed
 * value is undefined behavior.
 */

#define AVOID_TABLES
#ifdef AVOID_TABLES

#define NEG_1  ((unsigned int)-1)
#define HUFF_EXTEND(x, s) \
  ((x) + ((((x) - (1 << ((s) - 1))) >> 31) & (((NEG_1) << (s)) + 1)))

#else

#define HUFF_EXTEND(x, s) \
  ((x) < extend_test[s] ? (x) + extend_offset[s] : (x))

static const int extend_test[16] = {   /* entry n is 2**(n-1) */
  0, 0x0001, 0x0002, 0x0004, 0x0008, 0x0010, 0x0020, 0x0040, 0x0080,
  0x0100, 0x0200, 0x0400, 0x0800, 0x1000, 0x2000, 0x4000
};

/* Entry n is 1 - 2**n.  Written without shifting a negative value, which
 * would be undefined behavior.
 */
static const int extend_offset[16] = {
  0, 1 - (1 << 1), 1 - (1 << 2), 1 - (1 << 3), 1 - (1 << 4),
  1 - (1 << 5), 1 - (1 << 6), 1 - (1 << 7), 1 - (1 << 8),
  1 - (1 << 9), 1 - (1 << 10), 1 - (1 << 11), 1 - (1 << 12),
  1 - (1 << 13), 1 - (1 << 14), 1 - (1 << 15)
};

#endif /* AVOID_TABLES */
502
503
504/*
505 * Check for a restart marker & resynchronize decoder.
506 * Returns FALSE if must suspend.
507 */
508
509LOCAL(boolean)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800510process_restart(j_decompress_ptr cinfo)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000511{
Chris Blumecca8c4d2019-03-01 01:09:50 -0800512 huff_entropy_ptr entropy = (huff_entropy_ptr)cinfo->entropy;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000513 int ci;
514
515 /* Throw away any unused bits remaining in bit buffer; */
516 /* include any full bytes in next_marker's count of discarded bytes */
517 cinfo->marker->discarded_bytes += entropy->bitstate.bits_left / 8;
518 entropy->bitstate.bits_left = 0;
519
520 /* Advance past the RSTn marker */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800521 if (!(*cinfo->marker->read_restart_marker) (cinfo))
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000522 return FALSE;
523
524 /* Re-initialize DC predictions to 0 */
525 for (ci = 0; ci < cinfo->comps_in_scan; ci++)
526 entropy->saved.last_dc_val[ci] = 0;
527
528 /* Reset restart counter */
529 entropy->restarts_to_go = cinfo->restart_interval;
530
531 /* Reset out-of-data flag, unless read_restart_marker left us smack up
532 * against a marker. In that case we will end up treating the next data
533 * segment as empty, and we can avoid producing bogus output pixels by
534 * leaving the flag set.
535 */
536 if (cinfo->unread_marker == 0)
537 entropy->pub.insufficient_data = FALSE;
538
539 return TRUE;
540}
541
542
Jonathan Wright24e31052021-04-26 12:10:48 +0100543#if defined(__has_feature)
544#if __has_feature(undefined_behavior_sanitizer)
545__attribute__((no_sanitize("signed-integer-overflow"),
546 no_sanitize("unsigned-integer-overflow")))
547#endif
548#endif
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000549LOCAL(boolean)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800550decode_mcu_slow(j_decompress_ptr cinfo, JBLOCKROW *MCU_data)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000551{
Chris Blumecca8c4d2019-03-01 01:09:50 -0800552 huff_entropy_ptr entropy = (huff_entropy_ptr)cinfo->entropy;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000553 BITREAD_STATE_VARS;
554 int blkn;
555 savable_state state;
556 /* Outer loop handles each block in the MCU */
557
558 /* Load up working state */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800559 BITREAD_LOAD_STATE(cinfo, entropy->bitstate);
Jonathan Wrightbbb82822020-11-25 13:36:43 +0000560 state = entropy->saved;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000561
562 for (blkn = 0; blkn < cinfo->blocks_in_MCU; blkn++) {
Aaron Gablec9c87552015-08-03 09:34:32 -0700563 JBLOCKROW block = MCU_data ? MCU_data[blkn] : NULL;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400564 d_derived_tbl *dctbl = entropy->dc_cur_tbls[blkn];
565 d_derived_tbl *actbl = entropy->ac_cur_tbls[blkn];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000566 register int s, k, r;
567
568 /* Decode a single block's worth of coefficients */
569
570 /* Section F.2.2.1: decode the DC coefficient difference */
571 HUFF_DECODE(s, br_state, dctbl, return FALSE, label1);
572 if (s) {
573 CHECK_BIT_BUFFER(br_state, s, return FALSE);
574 r = GET_BITS(s);
575 s = HUFF_EXTEND(r, s);
576 }
577
578 if (entropy->dc_needed[blkn]) {
579 /* Convert DC difference to actual value, update last_dc_val */
580 int ci = cinfo->MCU_membership[blkn];
Jonathan Wright24e31052021-04-26 12:10:48 +0100581 /* Certain malformed JPEG images produce repeated DC coefficient
582 * differences of 2047 or -2047, which causes state.last_dc_val[ci] to
583 * grow until it overflows or underflows a 32-bit signed integer. This
584 * behavior is, to the best of our understanding, innocuous, and it is
585 * unclear how to work around it without potentially affecting
586 * performance. Thus, we (hopefully temporarily) suppress UBSan integer
587 * overflow errors for this function.
Jonathan Wrightdb870df2020-08-05 11:42:22 +0100588 */
Jonathan Wright24e31052021-04-26 12:10:48 +0100589 s += state.last_dc_val[ci];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000590 state.last_dc_val[ci] = s;
Aaron Gablec9c87552015-08-03 09:34:32 -0700591 if (block) {
592 /* Output the DC coefficient (assumes jpeg_natural_order[0] = 0) */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800593 (*block)[0] = (JCOEF)s;
Aaron Gablec9c87552015-08-03 09:34:32 -0700594 }
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000595 }
596
Aaron Gablec9c87552015-08-03 09:34:32 -0700597 if (entropy->ac_needed[blkn] && block) {
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000598
599 /* Section F.2.2.2: decode the AC coefficients */
600 /* Since zeroes are skipped, output area must be cleared beforehand */
601 for (k = 1; k < DCTSIZE2; k++) {
602 HUFF_DECODE(s, br_state, actbl, return FALSE, label2);
603
604 r = s >> 4;
605 s &= 15;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400606
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000607 if (s) {
608 k += r;
609 CHECK_BIT_BUFFER(br_state, s, return FALSE);
610 r = GET_BITS(s);
611 s = HUFF_EXTEND(r, s);
612 /* Output coefficient in natural (dezigzagged) order.
613 * Note: the extra entries in jpeg_natural_order[] will save us
614 * if k >= DCTSIZE2, which could happen if the data is corrupted.
615 */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800616 (*block)[jpeg_natural_order[k]] = (JCOEF)s;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000617 } else {
618 if (r != 15)
619 break;
620 k += 15;
621 }
622 }
623
624 } else {
625
626 /* Section F.2.2.2: decode the AC coefficients */
627 /* In this path we just discard the values */
628 for (k = 1; k < DCTSIZE2; k++) {
629 HUFF_DECODE(s, br_state, actbl, return FALSE, label3);
630
631 r = s >> 4;
632 s &= 15;
633
634 if (s) {
635 k += r;
636 CHECK_BIT_BUFFER(br_state, s, return FALSE);
637 DROP_BITS(s);
638 } else {
639 if (r != 15)
640 break;
641 k += 15;
642 }
643 }
644 }
645 }
646
647 /* Completed MCU, so update state */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800648 BITREAD_SAVE_STATE(cinfo, entropy->bitstate);
Jonathan Wrightbbb82822020-11-25 13:36:43 +0000649 entropy->saved = state;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000650 return TRUE;
651}
652
653
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000654LOCAL(boolean)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800655decode_mcu_fast(j_decompress_ptr cinfo, JBLOCKROW *MCU_data)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000656{
Chris Blumecca8c4d2019-03-01 01:09:50 -0800657 huff_entropy_ptr entropy = (huff_entropy_ptr)cinfo->entropy;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000658 BITREAD_STATE_VARS;
659 JOCTET *buffer;
660 int blkn;
661 savable_state state;
662 /* Outer loop handles each block in the MCU */
663
664 /* Load up working state */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800665 BITREAD_LOAD_STATE(cinfo, entropy->bitstate);
666 buffer = (JOCTET *)br_state.next_input_byte;
Jonathan Wrightbbb82822020-11-25 13:36:43 +0000667 state = entropy->saved;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000668
669 for (blkn = 0; blkn < cinfo->blocks_in_MCU; blkn++) {
Aaron Gable631e2dd2015-08-11 13:03:18 -0700670 JBLOCKROW block = MCU_data ? MCU_data[blkn] : NULL;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400671 d_derived_tbl *dctbl = entropy->dc_cur_tbls[blkn];
672 d_derived_tbl *actbl = entropy->ac_cur_tbls[blkn];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000673 register int s, k, r, l;
674
Jonathan Wright24e31052021-04-26 12:10:48 +0100675 HUFF_DECODE_FAST(s, l, dctbl);
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000676 if (s) {
hbono@chromium.org98626972011-08-03 03:13:08 +0000677 FILL_BIT_BUFFER_FAST
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000678 r = GET_BITS(s);
679 s = HUFF_EXTEND(r, s);
680 }
681
682 if (entropy->dc_needed[blkn]) {
683 int ci = cinfo->MCU_membership[blkn];
Jonathan Wright24e31052021-04-26 12:10:48 +0100684 s += state.last_dc_val[ci];
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000685 state.last_dc_val[ci] = s;
Aaron Gablec9c87552015-08-03 09:34:32 -0700686 if (block)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800687 (*block)[0] = (JCOEF)s;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000688 }
689
Aaron Gablec9c87552015-08-03 09:34:32 -0700690 if (entropy->ac_needed[blkn] && block) {
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000691
692 for (k = 1; k < DCTSIZE2; k++) {
Jonathan Wright24e31052021-04-26 12:10:48 +0100693 HUFF_DECODE_FAST(s, l, actbl);
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000694 r = s >> 4;
695 s &= 15;
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400696
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000697 if (s) {
698 k += r;
hbono@chromium.org98626972011-08-03 03:13:08 +0000699 FILL_BIT_BUFFER_FAST
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000700 r = GET_BITS(s);
701 s = HUFF_EXTEND(r, s);
Chris Blumecca8c4d2019-03-01 01:09:50 -0800702 (*block)[jpeg_natural_order[k]] = (JCOEF)s;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000703 } else {
704 if (r != 15) break;
705 k += 15;
706 }
707 }
708
709 } else {
710
711 for (k = 1; k < DCTSIZE2; k++) {
Jonathan Wright24e31052021-04-26 12:10:48 +0100712 HUFF_DECODE_FAST(s, l, actbl);
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000713 r = s >> 4;
714 s &= 15;
715
716 if (s) {
717 k += r;
hbono@chromium.org98626972011-08-03 03:13:08 +0000718 FILL_BIT_BUFFER_FAST
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000719 DROP_BITS(s);
720 } else {
721 if (r != 15) break;
722 k += 15;
723 }
724 }
725 }
726 }
727
hbono@chromium.org98626972011-08-03 03:13:08 +0000728 if (cinfo->unread_marker != 0) {
729 cinfo->unread_marker = 0;
730 return FALSE;
731 }
732
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000733 br_state.bytes_in_buffer -= (buffer - br_state.next_input_byte);
734 br_state.next_input_byte = buffer;
Chris Blumecca8c4d2019-03-01 01:09:50 -0800735 BITREAD_SAVE_STATE(cinfo, entropy->bitstate);
Jonathan Wrightbbb82822020-11-25 13:36:43 +0000736 entropy->saved = state;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000737 return TRUE;
738}
739
740
741/*
742 * Decode and return one MCU's worth of Huffman-compressed coefficients.
743 * The coefficients are reordered from zigzag order into natural array order,
744 * but are not dequantized.
745 *
746 * The i'th block of the MCU is stored into the block pointed to by
747 * MCU_data[i]. WE ASSUME THIS AREA HAS BEEN ZEROED BY THE CALLER.
748 * (Wholesale zeroing is usually a little faster than retail...)
749 *
750 * Returns FALSE if data source requested suspension. In that case no
751 * changes have been made to permanent state. (Exception: some output
752 * coefficients may already have been assigned. This is harmless for
753 * this module, since we'll just re-assign them on the next call.)
754 */
755
Chris Blumecca8c4d2019-03-01 01:09:50 -0800756#define BUFSIZE (DCTSIZE2 * 8)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000757
758METHODDEF(boolean)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800759decode_mcu(j_decompress_ptr cinfo, JBLOCKROW *MCU_data)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000760{
Chris Blumecca8c4d2019-03-01 01:09:50 -0800761 huff_entropy_ptr entropy = (huff_entropy_ptr)cinfo->entropy;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000762 int usefast = 1;
763
764 /* Process restart marker if needed; may have to suspend */
765 if (cinfo->restart_interval) {
766 if (entropy->restarts_to_go == 0)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800767 if (!process_restart(cinfo))
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400768 return FALSE;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000769 usefast = 0;
770 }
771
Chris Blumecca8c4d2019-03-01 01:09:50 -0800772 if (cinfo->src->bytes_in_buffer < BUFSIZE * (size_t)cinfo->blocks_in_MCU ||
773 cinfo->unread_marker != 0)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000774 usefast = 0;
775
776 /* If we've run out of data, just leave the MCU set to zeroes.
777 * This way, we return uniform gray for the remainder of the segment.
778 */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800779 if (!entropy->pub.insufficient_data) {
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000780
781 if (usefast) {
hbono@chromium.org98626972011-08-03 03:13:08 +0000782 if (!decode_mcu_fast(cinfo, MCU_data)) goto use_slow;
Chris Blumecca8c4d2019-03-01 01:09:50 -0800783 } else {
784use_slow:
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000785 if (!decode_mcu_slow(cinfo, MCU_data)) return FALSE;
786 }
787
788 }
789
790 /* Account for restart interval (no-op if not using restarts) */
Jonathan Wright24e31052021-04-26 12:10:48 +0100791 if (cinfo->restart_interval)
792 entropy->restarts_to_go--;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000793
794 return TRUE;
795}
796
797
798/*
799 * Module initialization routine for Huffman entropy decoding.
800 */
801
802GLOBAL(void)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800803jinit_huff_decoder(j_decompress_ptr cinfo)
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000804{
805 huff_entropy_ptr entropy;
806 int i;
807
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400808 /* Motion JPEG frames typically do not include the Huffman tables if they
809 are the default tables. Thus, if the tables are not set by the time
810 the Huffman decoder is initialized (usually within the body of
811 jpeg_start_decompress()), we set them to default values. */
Chris Blumecca8c4d2019-03-01 01:09:50 -0800812 std_huff_tables((j_common_ptr)cinfo);
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400813
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000814 entropy = (huff_entropy_ptr)
Chris Blumecca8c4d2019-03-01 01:09:50 -0800815 (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
Tom Hudson0d47d2d2016-05-04 13:22:56 -0400816 sizeof(huff_entropy_decoder));
Chris Blumecca8c4d2019-03-01 01:09:50 -0800817 cinfo->entropy = (struct jpeg_entropy_decoder *)entropy;
hbono@chromium.orgf0c4f332010-11-01 05:14:55 +0000818 entropy->pub.start_pass = start_pass_huff_decoder;
819 entropy->pub.decode_mcu = decode_mcu;
820
821 /* Mark tables unallocated */
822 for (i = 0; i < NUM_HUFF_TBLS; i++) {
823 entropy->dc_derived_tbls[i] = entropy->ac_derived_tbls[i] = NULL;
824 }
825}