blob: f9abbad99a11a5fc2fa7d5525cd09f2ebe8fab89 [file] [log] [blame]
Thomas G. Lane36a4ccc1994-09-24 00:00:00 +00001/*
2 * jdmainct.c
3 *
4 * Copyright (C) 1994, Thomas G. Lane.
5 * This file is part of the Independent JPEG Group's software.
6 * For conditions of distribution and use, see the accompanying README file.
7 *
8 * This file contains the main buffer controller for decompression.
9 * The main buffer lies between the JPEG decompressor proper and the
10 * post-processor; it holds downsampled data in the JPEG colorspace.
11 */
12
13#define JPEG_INTERNALS
14#include "jinclude.h"
15#include "jpeglib.h"
16
17
18/*
19 * In the current system design, the main buffer need never be a full-image
20 * buffer; any full-height buffers will be found inside the coefficient or
21 * postprocessing controllers. Nonetheless, the main controller is not
22 * trivial. Its responsibility is to provide context rows for upsampling/
23 * rescaling, and doing this in an efficient fashion is a bit tricky.
24 *
25 * Postprocessor input data is counted in "row groups". A row group
26 * is defined to be (v_samp_factor * DCT_scaled_size / min_DCT_scaled_size)
27 * sample rows of each component. (We require DCT_scaled_size values to be
28 * chosen such that these numbers are integers. In practice DCT_scaled_size
29 * values will likely be powers of two, so we actually have the stronger
30 * condition that DCT_scaled_size / min_DCT_scaled_size is an integer.)
31 * Upsampling will typically produce max_v_samp_factor pixel rows from each
32 * row group (times any additional scale factor that the upsampler is
33 * applying).
34 *
35 * The coefficient controller will deliver data to us one iMCU row at a time;
36 * each iMCU row contains v_samp_factor * DCT_scaled_size sample rows, or
37 * exactly min_DCT_scaled_size row groups. (This amount of data corresponds
38 * to one row of MCUs when the image is fully interleaved.) Note that the
39 * number of sample rows varies across components, but the number of row
40 * groups does not. Some garbage sample rows may be included in the last iMCU
41 * row at the bottom of the image.
42 *
43 * Depending on the vertical scaling algorithm used, the upsampler may need
44 * access to the sample row(s) above and below its current input row group.
45 * The upsampler is required to set need_context_rows TRUE at global selection
46 * time if so. When need_context_rows is FALSE, this controller can simply
47 * obtain one iMCU row at a time from the coefficient controller and dole it
48 * out as row groups to the postprocessor.
49 *
50 * When need_context_rows is TRUE, this controller guarantees that the buffer
51 * passed to postprocessing contains at least one row group's worth of samples
52 * above and below the row group(s) being processed. Note that the context
53 * rows "above" the first passed row group appear at negative row offsets in
54 * the passed buffer. At the top and bottom of the image, the required
55 * context rows are manufactured by duplicating the first or last real sample
56 * row; this avoids having special cases in the upsampling inner loops.
57 *
58 * The amount of context is fixed at one row group just because that's a
59 * convenient number for this controller to work with. The existing
60 * upsamplers really only need one sample row of context. An upsampler
61 * supporting arbitrary output rescaling might wish for more than one row
62 * group of context when shrinking the image; tough, we don't handle that.
63 * (This is justified by the assumption that downsizing will be handled mostly
64 * by adjusting the DCT_scaled_size values, so that the actual scale factor at
65 * the upsample step needn't be much less than one.)
66 *
67 * To provide the desired context, we have to retain the last two row groups
68 * of one iMCU row while reading in the next iMCU row. (The last row group
69 * can't be processed until we have another row group for its below-context,
70 * and so we have to save the next-to-last group too for its above-context.)
71 * We could do this most simply by copying data around in our buffer, but
72 * that'd be very slow. We can avoid copying any data by creating a rather
73 * strange pointer structure. Here's how it works. We allocate a workspace
74 * consisting of M+2 row groups (where M = min_DCT_scaled_size is the number
75 * of row groups per iMCU row). We create two sets of redundant pointers to
76 * the workspace. Labeling the physical row groups 0 to M+1, the synthesized
77 * pointer lists look like this:
78 * M+1 M-1
79 * master pointer --> 0 master pointer --> 0
80 * 1 1
81 * ... ...
82 * M-3 M-3
83 * M-2 M
84 * M-1 M+1
85 * M M-2
86 * M+1 M-1
87 * 0 0
88 * We read alternate iMCU rows using each master pointer; thus the last two
89 * row groups of the previous iMCU row remain un-overwritten in the workspace.
90 * The pointer lists are set up so that the required context rows appear to
91 * be adjacent to the proper places when we pass the pointer lists to the
92 * upsampler.
93 *
94 * The above pictures describe the normal state of the pointer lists.
95 * At top and bottom of the image, we diddle the pointer lists to duplicate
96 * the first or last sample row as necessary (this is cheaper than copying
97 * sample rows around).
98 *
99 * This scheme breaks down if M < 2, ie, min_DCT_scaled_size is 1. In that
100 * situation each iMCU row provides only one row group so the buffering logic
101 * must be different (eg, we must read two iMCU rows before we can emit the
102 * first row group). For now, we simply do not support providing context
103 * rows when min_DCT_scaled_size is 1. That combination seems unlikely to
104 * be worth providing --- if someone wants a 1/8th-size preview, they probably
105 * want it quick and dirty, so a context-free upsampler is sufficient.
106 */
107
108
109/* Private buffer controller object */
110
111typedef struct {
112 struct jpeg_d_main_controller pub; /* public fields */
113
114 /* Pointer to allocated workspace (M or M+2 row groups). */
115 JSAMPARRAY buffer[MAX_COMPONENTS];
116
117 boolean buffer_full; /* Have we gotten an iMCU row from decoder? */
118 JDIMENSION rowgroup_ctr; /* counts row groups output to postprocessor */
119
120 /* Remaining fields are only used in the context case. */
121
122 /* These are the master pointers to the funny-order pointer lists. */
123 JSAMPIMAGE xbuffer[2]; /* pointers to weird pointer lists */
124
125 int whichptr; /* indicates which pointer set is now in use */
126 int context_state; /* process_data state machine status */
127 JDIMENSION rowgroups_avail; /* row groups available to postprocessor */
128 JDIMENSION iMCU_row_ctr; /* counts iMCU rows to detect image top/bot */
129} my_main_controller;
130
131typedef my_main_controller * my_main_ptr;
132
133/* context_state values: */
134#define CTX_PREPARE_FOR_IMCU 0 /* need to prepare for MCU row */
135#define CTX_PROCESS_IMCU 1 /* feeding iMCU to postprocessor */
136#define CTX_POSTPONED_ROW 2 /* feeding postponed row group */
137
138
139/* Forward declarations */
140METHODDEF void process_data_simple_main
141 JPP((j_decompress_ptr cinfo, JSAMPARRAY output_buf,
142 JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail));
143METHODDEF void process_data_context_main
144 JPP((j_decompress_ptr cinfo, JSAMPARRAY output_buf,
145 JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail));
146#ifdef D_MULTISCAN_FILES_SUPPORTED
147METHODDEF void process_data_input_only
148 JPP((j_decompress_ptr cinfo, JSAMPARRAY output_buf,
149 JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail));
150#endif
151#ifdef QUANT_2PASS_SUPPORTED
152METHODDEF void process_data_crank_post
153 JPP((j_decompress_ptr cinfo, JSAMPARRAY output_buf,
154 JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail));
155#endif
156
157
158LOCAL void
159make_funny_pointers (j_decompress_ptr cinfo)
160/* Create the funny pointer lists discussed in the comments above.
161 * The actual workspace is already allocated (in main->buffer),
162 * we just have to make the curiously ordered lists.
163 */
164{
165 my_main_ptr main = (my_main_ptr) cinfo->main;
166 int ci, i, rgroup;
167 int M = cinfo->min_DCT_scaled_size;
168 jpeg_component_info *compptr;
169 JSAMPARRAY buf, xbuf0, xbuf1;
170
171 /* Get top-level space for component array pointers.
172 * We alloc both arrays with one call to save a few cycles.
173 */
174 main->xbuffer[0] = (JSAMPIMAGE)
175 (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
176 cinfo->num_components * 2 * SIZEOF(JSAMPARRAY));
177 main->xbuffer[1] = main->xbuffer[0] + cinfo->num_components;
178
179 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
180 ci++, compptr++) {
181 rgroup = (compptr->v_samp_factor * compptr->DCT_scaled_size) /
182 cinfo->min_DCT_scaled_size; /* height of a row group of component */
183 /* Get space for pointer lists --- M+4 row groups in each list.
184 * We alloc both pointer lists with one call to save a few cycles.
185 */
186 xbuf0 = (JSAMPARRAY)
187 (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
188 2 * (rgroup * (M + 4)) * SIZEOF(JSAMPROW));
189 xbuf0 += rgroup; /* want one row group at negative offsets */
190 main->xbuffer[0][ci] = xbuf0;
191 xbuf1 = xbuf0 + (rgroup * (M + 4));
192 main->xbuffer[1][ci] = xbuf1;
193 /* First copy the workspace pointers as-is */
194 buf = main->buffer[ci];
195 for (i = 0; i < rgroup * (M + 2); i++) {
196 xbuf0[i] = xbuf1[i] = buf[i];
197 }
198 /* In the second list, put the last four row groups in swapped order */
199 for (i = 0; i < rgroup * 2; i++) {
200 xbuf1[rgroup*(M-2) + i] = buf[rgroup*M + i];
201 xbuf1[rgroup*M + i] = buf[rgroup*(M-2) + i];
202 }
203 /* The wraparound pointers at top and bottom will be filled later
204 * (see set_wraparound_pointers, below). Initially we want the "above"
205 * pointers to duplicate the first actual data line. This only needs
206 * to happen in xbuffer[0].
207 */
208 for (i = 0; i < rgroup; i++) {
209 xbuf0[i - rgroup] = xbuf0[0];
210 }
211 }
212}
213
214
215LOCAL void
216set_wraparound_pointers (j_decompress_ptr cinfo)
217/* Set up the "wraparound" pointers at top and bottom of the pointer lists.
218 * This changes the pointer list state from top-of-image to the normal state.
219 */
220{
221 my_main_ptr main = (my_main_ptr) cinfo->main;
222 int ci, i, rgroup;
223 int M = cinfo->min_DCT_scaled_size;
224 jpeg_component_info *compptr;
225 JSAMPARRAY xbuf0, xbuf1;
226
227 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
228 ci++, compptr++) {
229 rgroup = (compptr->v_samp_factor * compptr->DCT_scaled_size) /
230 cinfo->min_DCT_scaled_size; /* height of a row group of component */
231 xbuf0 = main->xbuffer[0][ci];
232 xbuf1 = main->xbuffer[1][ci];
233 for (i = 0; i < rgroup; i++) {
234 xbuf0[i - rgroup] = xbuf0[rgroup*(M+1) + i];
235 xbuf1[i - rgroup] = xbuf1[rgroup*(M+1) + i];
236 xbuf0[rgroup*(M+2) + i] = xbuf0[i];
237 xbuf1[rgroup*(M+2) + i] = xbuf1[i];
238 }
239 }
240}
241
242
243LOCAL void
244set_bottom_pointers (j_decompress_ptr cinfo)
245/* Change the pointer lists to duplicate the last sample row at the bottom
246 * of the image. whichptr indicates which xbuffer holds the final iMCU row.
247 * Also sets rowgroups_avail to indicate number of nondummy row groups in row.
248 */
249{
250 my_main_ptr main = (my_main_ptr) cinfo->main;
251 int ci, i, rgroup, iMCUheight, rows_left;
252 jpeg_component_info *compptr;
253 JSAMPARRAY xbuf;
254
255 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
256 ci++, compptr++) {
257 /* Count sample rows in one iMCU row and in one row group */
258 iMCUheight = compptr->v_samp_factor * compptr->DCT_scaled_size;
259 rgroup = iMCUheight / cinfo->min_DCT_scaled_size;
260 /* Count nondummy sample rows remaining for this component */
261 rows_left = (int) (compptr->downsampled_height % (JDIMENSION) iMCUheight);
262 if (rows_left == 0) rows_left = iMCUheight;
263 /* Count nondummy row groups. Should get same answer for each component,
264 * so we need only do it once.
265 */
266 if (ci == 0) {
267 main->rowgroups_avail = (JDIMENSION) ((rows_left-1) / rgroup + 1);
268 }
269 /* Duplicate the last real sample row rgroup*2 times; this pads out the
270 * last partial rowgroup and ensures at least one full rowgroup of context.
271 */
272 xbuf = main->xbuffer[main->whichptr][ci];
273 for (i = 0; i < rgroup * 2; i++) {
274 xbuf[rows_left + i] = xbuf[rows_left-1];
275 }
276 }
277}
278
279
280/*
281 * Initialize for a processing pass.
282 */
283
284METHODDEF void
285start_pass_main (j_decompress_ptr cinfo, J_BUF_MODE pass_mode)
286{
287 my_main_ptr main = (my_main_ptr) cinfo->main;
288
289 /* Processing chunks are output rows except in JBUF_CRANK_SOURCE mode. */
290 main->pub.num_chunks = cinfo->output_height;
291
292 switch (pass_mode) {
293 case JBUF_PASS_THRU:
294 /* Do nothing if raw-data mode. */
295 if (cinfo->raw_data_out)
296 return;
297 if (cinfo->upsample->need_context_rows) {
298 main->pub.process_data = process_data_context_main;
299 make_funny_pointers(cinfo); /* Create the xbuffer[] lists */
300 main->whichptr = 0; /* Read first iMCU row into xbuffer[0] */
301 main->context_state = CTX_PREPARE_FOR_IMCU;
302 main->iMCU_row_ctr = 0;
303 } else {
304 /* Simple case with no context needed */
305 main->pub.process_data = process_data_simple_main;
306 }
307 main->buffer_full = FALSE; /* Mark buffer empty */
308 main->rowgroup_ctr = 0;
309 break;
310#ifdef D_MULTISCAN_FILES_SUPPORTED
311 case JBUF_CRANK_SOURCE:
312 /* Reading a multi-scan file, just crank the decompressor */
313 main->pub.process_data = process_data_input_only;
314 /* decompressor needs to be called once for each (equivalent) iMCU row */
315 main->pub.num_chunks = cinfo->total_iMCU_rows;
316 break;
317#endif
318#ifdef QUANT_2PASS_SUPPORTED
319 case JBUF_CRANK_DEST:
320 /* For last pass of 2-pass quantization, just crank the postprocessor */
321 main->pub.process_data = process_data_crank_post;
322 break;
323#endif
324 default:
325 ERREXIT(cinfo, JERR_BAD_BUFFER_MODE);
326 break;
327 }
328}
329
330
331/*
332 * Process some data.
333 * This handles the simple case where no context is required.
334 */
335
336METHODDEF void
337process_data_simple_main (j_decompress_ptr cinfo,
338 JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
339 JDIMENSION out_rows_avail)
340{
341 my_main_ptr main = (my_main_ptr) cinfo->main;
342 JDIMENSION rowgroups_avail;
343
344 /* Read input data if we haven't filled the main buffer yet */
345 if (! main->buffer_full) {
346 if (! (*cinfo->coef->decompress_data) (cinfo, main->buffer))
347 return; /* suspension forced, can do nothing more */
348 main->buffer_full = TRUE; /* OK, we have an iMCU row to work with */
349 }
350
351 /* There are always min_DCT_scaled_size row groups in an iMCU row. */
352 rowgroups_avail = (JDIMENSION) cinfo->min_DCT_scaled_size;
353 /* Note: at the bottom of the image, we may pass extra garbage row groups
354 * to the postprocessor. The postprocessor has to check for bottom
355 * of image anyway (at row resolution), so no point in us doing it too.
356 */
357
358 /* Feed the postprocessor */
359 (*cinfo->post->post_process_data) (cinfo, main->buffer,
360 &main->rowgroup_ctr, rowgroups_avail,
361 output_buf, out_row_ctr, out_rows_avail);
362
363 /* Has postprocessor consumed all the data yet? If so, mark buffer empty */
364 if (main->rowgroup_ctr >= rowgroups_avail) {
365 main->buffer_full = FALSE;
366 main->rowgroup_ctr = 0;
367 }
368}
369
370
371/*
372 * Process some data.
373 * This handles the case where context rows must be provided.
374 */
375
376METHODDEF void
377process_data_context_main (j_decompress_ptr cinfo,
378 JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
379 JDIMENSION out_rows_avail)
380{
381 my_main_ptr main = (my_main_ptr) cinfo->main;
382
383 /* Read input data if we haven't filled the main buffer yet */
384 if (! main->buffer_full) {
385 if (! (*cinfo->coef->decompress_data) (cinfo,
386 main->xbuffer[main->whichptr]))
387 return; /* suspension forced, can do nothing more */
388 main->buffer_full = TRUE; /* OK, we have an iMCU row to work with */
389 main->iMCU_row_ctr++; /* count rows received */
390 }
391
392 /* Postprocessor typically will not swallow all the input data it is handed
393 * in one call (due to filling the output buffer first). Must be prepared
394 * to exit and restart. This switch lets us keep track of how far we got.
395 * Note that each case falls through to the next on successful completion.
396 */
397 switch (main->context_state) {
398 case CTX_POSTPONED_ROW:
399 /* Call postprocessor using previously set pointers for postponed row */
400 (*cinfo->post->post_process_data) (cinfo, main->xbuffer[main->whichptr],
401 &main->rowgroup_ctr, main->rowgroups_avail,
402 output_buf, out_row_ctr, out_rows_avail);
403 if (main->rowgroup_ctr < main->rowgroups_avail)
404 return; /* Need to suspend */
405 main->context_state = CTX_PREPARE_FOR_IMCU;
406 if (*out_row_ctr >= out_rows_avail)
407 return; /* Postprocessor exactly filled output buf */
408 /*FALLTHROUGH*/
409 case CTX_PREPARE_FOR_IMCU:
410 /* Prepare to process first M-1 row groups of this iMCU row */
411 main->rowgroup_ctr = 0;
412 main->rowgroups_avail = (JDIMENSION) (cinfo->min_DCT_scaled_size - 1);
413 /* Check for bottom of image: if so, tweak pointers to "duplicate"
414 * the last sample row, and adjust rowgroups_avail to ignore padding rows.
415 */
416 if (main->iMCU_row_ctr == cinfo->total_iMCU_rows)
417 set_bottom_pointers(cinfo);
418 main->context_state = CTX_PROCESS_IMCU;
419 /*FALLTHROUGH*/
420 case CTX_PROCESS_IMCU:
421 /* Call postprocessor using previously set pointers */
422 (*cinfo->post->post_process_data) (cinfo, main->xbuffer[main->whichptr],
423 &main->rowgroup_ctr, main->rowgroups_avail,
424 output_buf, out_row_ctr, out_rows_avail);
425 if (main->rowgroup_ctr < main->rowgroups_avail)
426 return; /* Need to suspend */
427 /* After the first iMCU, change wraparound pointers to normal state */
428 if (main->iMCU_row_ctr == 1)
429 set_wraparound_pointers(cinfo);
430 /* Prepare to load new iMCU row using other xbuffer list */
431 main->whichptr ^= 1; /* 0=>1 or 1=>0 */
432 main->buffer_full = FALSE;
433 /* Still need to process last row group of this iMCU row, */
434 /* which is saved at index M+1 of the other xbuffer */
435 main->rowgroup_ctr = (JDIMENSION) (cinfo->min_DCT_scaled_size + 1);
436 main->rowgroups_avail = (JDIMENSION) (cinfo->min_DCT_scaled_size + 2);
437 main->context_state = CTX_POSTPONED_ROW;
438 }
439}
440
441
442/*
443 * Process some data.
444 * Initial passes in a multiple-scan file: just call the decompressor,
445 * which will save data in its internal buffer, but return nothing.
446 */
447
448#ifdef D_MULTISCAN_FILES_SUPPORTED
449
450METHODDEF void
451process_data_input_only (j_decompress_ptr cinfo,
452 JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
453 JDIMENSION out_rows_avail)
454{
455 if (! (*cinfo->coef->decompress_data) (cinfo, (JSAMPIMAGE) NULL))
456 return; /* suspension forced, can do nothing more */
457 *out_row_ctr += 1; /* OK, we did one iMCU row */
458}
459
460#endif /* D_MULTISCAN_FILES_SUPPORTED */
461
462
463/*
464 * Process some data.
465 * Final pass of two-pass quantization: just call the postprocessor.
466 * Source data will be the postprocessor controller's internal buffer.
467 */
468
469#ifdef QUANT_2PASS_SUPPORTED
470
471METHODDEF void
472process_data_crank_post (j_decompress_ptr cinfo,
473 JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
474 JDIMENSION out_rows_avail)
475{
476 (*cinfo->post->post_process_data) (cinfo, (JSAMPIMAGE) NULL,
477 (JDIMENSION *) NULL, (JDIMENSION) 0,
478 output_buf, out_row_ctr, out_rows_avail);
479}
480
481#endif /* QUANT_2PASS_SUPPORTED */
482
483
484/*
485 * Initialize main buffer controller.
486 */
487
488GLOBAL void
489jinit_d_main_controller (j_decompress_ptr cinfo, boolean need_full_buffer)
490{
491 my_main_ptr main;
492 int ci, rgroup, ngroups;
493 jpeg_component_info *compptr;
494
495 main = (my_main_ptr)
496 (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
497 SIZEOF(my_main_controller));
498 cinfo->main = (struct jpeg_d_main_controller *) main;
499 main->pub.start_pass = start_pass_main;
500
501 if (need_full_buffer) /* shouldn't happen */
502 ERREXIT(cinfo, JERR_BAD_BUFFER_MODE);
503
504 /* In raw-data mode, we don't need a workspace. This module doesn't
505 * do anything useful in that mode, except pass calls through to the
506 * coef controller in CRANK_SOURCE mode (ie, reading a multiscan file).
507 */
508 if (cinfo->raw_data_out)
509 return;
510
511 /* Allocate the workspace.
512 * ngroups is the number of row groups we need.
513 */
514 if (cinfo->upsample->need_context_rows) {
515 if (cinfo->min_DCT_scaled_size < 2) /* unsupported, see comments above */
516 ERREXIT(cinfo, JERR_NOTIMPL);
517 ngroups = cinfo->min_DCT_scaled_size + 2;
518 } else {
519 ngroups = cinfo->min_DCT_scaled_size;
520 }
521
522 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
523 ci++, compptr++) {
524 rgroup = (compptr->v_samp_factor * compptr->DCT_scaled_size) /
525 cinfo->min_DCT_scaled_size; /* height of a row group of component */
526 main->buffer[ci] = (*cinfo->mem->alloc_sarray)
527 ((j_common_ptr) cinfo, JPOOL_IMAGE,
528 compptr->width_in_blocks * compptr->DCT_scaled_size,
529 (JDIMENSION) (rgroup * ngroups));
530 }
531}