1 /*
2 * jdsample.c
3 *
4 * This file was part of the Independent JPEG Group's software:
5 * Copyright (C) 1991-1996, Thomas G. Lane.
6 * libjpeg-turbo Modifications:
7 * Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
8 * Copyright (C) 2010, 2015-2016, D. R. Commander.
9 * Copyright (C) 2014, MIPS Technologies, Inc., California.
10 * Copyright (C) 2015, Google, Inc.
11 * For conditions of distribution and use, see the accompanying README.ijg
12 * file.
13 *
14 * This file contains upsampling routines.
15 *
16 * Upsampling input data is counted in "row groups". A row group
17 * is defined to be (v_samp_factor * DCT_scaled_size / min_DCT_scaled_size)
18 * sample rows of each component. Upsampling will normally produce
19 * max_v_samp_factor pixel rows from each row group (but this could vary
20 * if the upsampler is applying a scale factor of its own).
21 *
22 * An excellent reference for image resampling is
23 * Digital Image Warping, George Wolberg, 1990.
24 * Pub. by IEEE Computer Society Press, Los Alamitos, CA. ISBN 0-8186-8944-7.
25 */
26
27 #include "jinclude.h"
28 #include "jdsample.h"
29 #include "jsimd.h"
30 #include "jpegcomp.h"
31
32
33
34 /*
35 * Initialize for an upsampling pass.
36 */
37
38 METHODDEF(void)
start_pass_upsample(j_decompress_ptr cinfo)39 start_pass_upsample (j_decompress_ptr cinfo)
40 {
41 my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
42
43 /* Mark the conversion buffer empty */
44 upsample->next_row_out = cinfo->max_v_samp_factor;
45 /* Initialize total-height counter for detecting bottom of image */
46 upsample->rows_to_go = cinfo->output_height;
47 }
48
49
50 /*
51 * Control routine to do upsampling (and color conversion).
52 *
53 * In this version we upsample each component independently.
54 * We upsample one row group into the conversion buffer, then apply
55 * color conversion a row at a time.
56 */
57
58 METHODDEF(void)
sep_upsample(j_decompress_ptr cinfo,JSAMPIMAGE input_buf,JDIMENSION * in_row_group_ctr,JDIMENSION in_row_groups_avail,JSAMPARRAY output_buf,JDIMENSION * out_row_ctr,JDIMENSION out_rows_avail)59 sep_upsample (j_decompress_ptr cinfo,
60 JSAMPIMAGE input_buf, JDIMENSION *in_row_group_ctr,
61 JDIMENSION in_row_groups_avail,
62 JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
63 JDIMENSION out_rows_avail)
64 {
65 my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
66 int ci;
67 jpeg_component_info *compptr;
68 JDIMENSION num_rows;
69
70 /* Fill the conversion buffer, if it's empty */
71 if (upsample->next_row_out >= cinfo->max_v_samp_factor) {
72 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
73 ci++, compptr++) {
74 /* Invoke per-component upsample method. Notice we pass a POINTER
75 * to color_buf[ci], so that fullsize_upsample can change it.
76 */
77 (*upsample->methods[ci]) (cinfo, compptr,
78 input_buf[ci] + (*in_row_group_ctr * upsample->rowgroup_height[ci]),
79 upsample->color_buf + ci);
80 }
81 upsample->next_row_out = 0;
82 }
83
84 /* Color-convert and emit rows */
85
86 /* How many we have in the buffer: */
87 num_rows = (JDIMENSION) (cinfo->max_v_samp_factor - upsample->next_row_out);
88 /* Not more than the distance to the end of the image. Need this test
89 * in case the image height is not a multiple of max_v_samp_factor:
90 */
91 if (num_rows > upsample->rows_to_go)
92 num_rows = upsample->rows_to_go;
93 /* And not more than what the client can accept: */
94 out_rows_avail -= *out_row_ctr;
95 if (num_rows > out_rows_avail)
96 num_rows = out_rows_avail;
97
98 (*cinfo->cconvert->color_convert) (cinfo, upsample->color_buf,
99 (JDIMENSION) upsample->next_row_out,
100 output_buf + *out_row_ctr,
101 (int) num_rows);
102
103 /* Adjust counts */
104 *out_row_ctr += num_rows;
105 upsample->rows_to_go -= num_rows;
106 upsample->next_row_out += num_rows;
107 /* When the buffer is emptied, declare this input row group consumed */
108 if (upsample->next_row_out >= cinfo->max_v_samp_factor)
109 (*in_row_group_ctr)++;
110 }
111
112
113 /*
114 * These are the routines invoked by sep_upsample to upsample pixel values
115 * of a single component. One row group is processed per call.
116 */
117
118
119 /*
120 * For full-size components, we just make color_buf[ci] point at the
121 * input buffer, and thus avoid copying any data. Note that this is
122 * safe only because sep_upsample doesn't declare the input row group
123 * "consumed" until we are done color converting and emitting it.
124 */
125
126 METHODDEF(void)
fullsize_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)127 fullsize_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
128 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
129 {
130 *output_data_ptr = input_data;
131 }
132
133
134 /*
135 * This is a no-op version used for "uninteresting" components.
136 * These components will not be referenced by color conversion.
137 */
138
139 METHODDEF(void)
noop_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)140 noop_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
141 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
142 {
143 *output_data_ptr = NULL; /* safety check */
144 }
145
146
147 /*
148 * This version handles any integral sampling ratios.
149 * This is not used for typical JPEG files, so it need not be fast.
150 * Nor, for that matter, is it particularly accurate: the algorithm is
151 * simple replication of the input pixel onto the corresponding output
152 * pixels. The hi-falutin sampling literature refers to this as a
153 * "box filter". A box filter tends to introduce visible artifacts,
154 * so if you are actually going to use 3:1 or 4:1 sampling ratios
155 * you would be well advised to improve this code.
156 */
157
158 METHODDEF(void)
int_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)159 int_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
160 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
161 {
162 my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
163 JSAMPARRAY output_data = *output_data_ptr;
164 register JSAMPROW inptr, outptr;
165 register JSAMPLE invalue;
166 register int h;
167 JSAMPROW outend;
168 int h_expand, v_expand;
169 int inrow, outrow;
170
171 h_expand = upsample->h_expand[compptr->component_index];
172 v_expand = upsample->v_expand[compptr->component_index];
173
174 inrow = outrow = 0;
175 while (outrow < cinfo->max_v_samp_factor) {
176 /* Generate one output row with proper horizontal expansion */
177 inptr = input_data[inrow];
178 outptr = output_data[outrow];
179 outend = outptr + cinfo->output_width;
180 while (outptr < outend) {
181 invalue = *inptr++; /* don't need GETJSAMPLE() here */
182 for (h = h_expand; h > 0; h--) {
183 *outptr++ = invalue;
184 }
185 }
186 /* Generate any additional output rows by duplicating the first one */
187 if (v_expand > 1) {
188 jcopy_sample_rows(output_data, outrow, output_data, outrow+1,
189 v_expand-1, cinfo->output_width);
190 }
191 inrow++;
192 outrow += v_expand;
193 }
194 }
195
196
197 /*
198 * Fast processing for the common case of 2:1 horizontal and 1:1 vertical.
199 * It's still a box filter.
200 */
201
202 METHODDEF(void)
h2v1_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)203 h2v1_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
204 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
205 {
206 JSAMPARRAY output_data = *output_data_ptr;
207 register JSAMPROW inptr, outptr;
208 register JSAMPLE invalue;
209 JSAMPROW outend;
210 int inrow;
211
212 for (inrow = 0; inrow < cinfo->max_v_samp_factor; inrow++) {
213 inptr = input_data[inrow];
214 outptr = output_data[inrow];
215 outend = outptr + cinfo->output_width;
216 while (outptr < outend) {
217 invalue = *inptr++; /* don't need GETJSAMPLE() here */
218 *outptr++ = invalue;
219 *outptr++ = invalue;
220 }
221 }
222 }
223
224
225 /*
226 * Fast processing for the common case of 2:1 horizontal and 2:1 vertical.
227 * It's still a box filter.
228 */
229
230 METHODDEF(void)
h2v2_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)231 h2v2_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
232 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
233 {
234 JSAMPARRAY output_data = *output_data_ptr;
235 register JSAMPROW inptr, outptr;
236 register JSAMPLE invalue;
237 JSAMPROW outend;
238 int inrow, outrow;
239
240 inrow = outrow = 0;
241 while (outrow < cinfo->max_v_samp_factor) {
242 inptr = input_data[inrow];
243 outptr = output_data[outrow];
244 outend = outptr + cinfo->output_width;
245 while (outptr < outend) {
246 invalue = *inptr++; /* don't need GETJSAMPLE() here */
247 *outptr++ = invalue;
248 *outptr++ = invalue;
249 }
250 jcopy_sample_rows(output_data, outrow, output_data, outrow+1,
251 1, cinfo->output_width);
252 inrow++;
253 outrow += 2;
254 }
255 }
256
257
258 /*
259 * Fancy processing for the common case of 2:1 horizontal and 1:1 vertical.
260 *
261 * The upsampling algorithm is linear interpolation between pixel centers,
262 * also known as a "triangle filter". This is a good compromise between
263 * speed and visual quality. The centers of the output pixels are 1/4 and 3/4
264 * of the way between input pixel centers.
265 *
266 * A note about the "bias" calculations: when rounding fractional values to
267 * integer, we do not want to always round 0.5 up to the next integer.
268 * If we did that, we'd introduce a noticeable bias towards larger values.
269 * Instead, this code is arranged so that 0.5 will be rounded up or down at
270 * alternate pixel locations (a simple ordered dither pattern).
271 */
272
273 METHODDEF(void)
h2v1_fancy_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)274 h2v1_fancy_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
275 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
276 {
277 JSAMPARRAY output_data = *output_data_ptr;
278 register JSAMPROW inptr, outptr;
279 register int invalue;
280 register JDIMENSION colctr;
281 int inrow;
282
283 for (inrow = 0; inrow < cinfo->max_v_samp_factor; inrow++) {
284 inptr = input_data[inrow];
285 outptr = output_data[inrow];
286 /* Special case for first column */
287 invalue = GETJSAMPLE(*inptr++);
288 *outptr++ = (JSAMPLE) invalue;
289 *outptr++ = (JSAMPLE) ((invalue * 3 + GETJSAMPLE(*inptr) + 2) >> 2);
290
291 for (colctr = compptr->downsampled_width - 2; colctr > 0; colctr--) {
292 /* General case: 3/4 * nearer pixel + 1/4 * further pixel */
293 invalue = GETJSAMPLE(*inptr++) * 3;
294 *outptr++ = (JSAMPLE) ((invalue + GETJSAMPLE(inptr[-2]) + 1) >> 2);
295 *outptr++ = (JSAMPLE) ((invalue + GETJSAMPLE(*inptr) + 2) >> 2);
296 }
297
298 /* Special case for last column */
299 invalue = GETJSAMPLE(*inptr);
300 *outptr++ = (JSAMPLE) ((invalue * 3 + GETJSAMPLE(inptr[-1]) + 1) >> 2);
301 *outptr++ = (JSAMPLE) invalue;
302 }
303 }
304
305
306 /*
307 * Fancy processing for 1:1 horizontal and 2:1 vertical (4:4:0 subsampling).
308 *
309 * This is a less common case, but it can be encountered when losslessly
310 * rotating/transposing a JPEG file that uses 4:2:2 chroma subsampling.
311 */
312
313 METHODDEF(void)
h1v2_fancy_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)314 h1v2_fancy_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
315 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
316 {
317 JSAMPARRAY output_data = *output_data_ptr;
318 JSAMPROW inptr0, inptr1, outptr;
319 #if BITS_IN_JSAMPLE == 8
320 int thiscolsum;
321 #else
322 JLONG thiscolsum;
323 #endif
324 JDIMENSION colctr;
325 int inrow, outrow, v;
326
327 inrow = outrow = 0;
328 while (outrow < cinfo->max_v_samp_factor) {
329 for (v = 0; v < 2; v++) {
330 /* inptr0 points to nearest input row, inptr1 points to next nearest */
331 inptr0 = input_data[inrow];
332 if (v == 0) /* next nearest is row above */
333 inptr1 = input_data[inrow-1];
334 else /* next nearest is row below */
335 inptr1 = input_data[inrow+1];
336 outptr = output_data[outrow++];
337
338 for(colctr = 0; colctr < compptr->downsampled_width; colctr++) {
339 thiscolsum = GETJSAMPLE(*inptr0++) * 3 + GETJSAMPLE(*inptr1++);
340 *outptr++ = (JSAMPLE) ((thiscolsum + 1) >> 2);
341 }
342 }
343 inrow++;
344 }
345 }
346
347
348 /*
349 * Fancy processing for the common case of 2:1 horizontal and 2:1 vertical.
350 * Again a triangle filter; see comments for h2v1 case, above.
351 *
352 * It is OK for us to reference the adjacent input rows because we demanded
353 * context from the main buffer controller (see initialization code).
354 */
355
356 METHODDEF(void)
h2v2_fancy_upsample(j_decompress_ptr cinfo,jpeg_component_info * compptr,JSAMPARRAY input_data,JSAMPARRAY * output_data_ptr)357 h2v2_fancy_upsample (j_decompress_ptr cinfo, jpeg_component_info *compptr,
358 JSAMPARRAY input_data, JSAMPARRAY *output_data_ptr)
359 {
360 JSAMPARRAY output_data = *output_data_ptr;
361 register JSAMPROW inptr0, inptr1, outptr;
362 #if BITS_IN_JSAMPLE == 8
363 register int thiscolsum, lastcolsum, nextcolsum;
364 #else
365 register JLONG thiscolsum, lastcolsum, nextcolsum;
366 #endif
367 register JDIMENSION colctr;
368 int inrow, outrow, v;
369
370 inrow = outrow = 0;
371 while (outrow < cinfo->max_v_samp_factor) {
372 for (v = 0; v < 2; v++) {
373 /* inptr0 points to nearest input row, inptr1 points to next nearest */
374 inptr0 = input_data[inrow];
375 if (v == 0) /* next nearest is row above */
376 inptr1 = input_data[inrow-1];
377 else /* next nearest is row below */
378 inptr1 = input_data[inrow+1];
379 outptr = output_data[outrow++];
380
381 /* Special case for first column */
382 thiscolsum = GETJSAMPLE(*inptr0++) * 3 + GETJSAMPLE(*inptr1++);
383 nextcolsum = GETJSAMPLE(*inptr0++) * 3 + GETJSAMPLE(*inptr1++);
384 *outptr++ = (JSAMPLE) ((thiscolsum * 4 + 8) >> 4);
385 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + nextcolsum + 7) >> 4);
386 lastcolsum = thiscolsum; thiscolsum = nextcolsum;
387
388 for (colctr = compptr->downsampled_width - 2; colctr > 0; colctr--) {
389 /* General case: 3/4 * nearer pixel + 1/4 * further pixel in each */
390 /* dimension, thus 9/16, 3/16, 3/16, 1/16 overall */
391 nextcolsum = GETJSAMPLE(*inptr0++) * 3 + GETJSAMPLE(*inptr1++);
392 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + lastcolsum + 8) >> 4);
393 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + nextcolsum + 7) >> 4);
394 lastcolsum = thiscolsum; thiscolsum = nextcolsum;
395 }
396
397 /* Special case for last column */
398 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + lastcolsum + 8) >> 4);
399 *outptr++ = (JSAMPLE) ((thiscolsum * 4 + 7) >> 4);
400 }
401 inrow++;
402 }
403 }
404
405
406 /*
407 * Module initialization routine for upsampling.
408 */
409
410 GLOBAL(void)
jinit_upsampler(j_decompress_ptr cinfo)411 jinit_upsampler (j_decompress_ptr cinfo)
412 {
413 my_upsample_ptr upsample;
414 int ci;
415 jpeg_component_info *compptr;
416 boolean need_buffer, do_fancy;
417 int h_in_group, v_in_group, h_out_group, v_out_group;
418
419 if (!cinfo->master->jinit_upsampler_no_alloc) {
420 upsample = (my_upsample_ptr)
421 (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
422 sizeof(my_upsampler));
423 cinfo->upsample = (struct jpeg_upsampler *) upsample;
424 upsample->pub.start_pass = start_pass_upsample;
425 upsample->pub.upsample = sep_upsample;
426 upsample->pub.need_context_rows = FALSE; /* until we find out differently */
427 } else
428 upsample = (my_upsample_ptr) cinfo->upsample;
429
430 if (cinfo->CCIR601_sampling) /* this isn't supported */
431 ERREXIT(cinfo, JERR_CCIR601_NOTIMPL);
432
433 /* jdmainct.c doesn't support context rows when min_DCT_scaled_size = 1,
434 * so don't ask for it.
435 */
436 do_fancy = cinfo->do_fancy_upsampling && cinfo->_min_DCT_scaled_size > 1;
437
438 /* Verify we can handle the sampling factors, select per-component methods,
439 * and create storage as needed.
440 */
441 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
442 ci++, compptr++) {
443 /* Compute size of an "input group" after IDCT scaling. This many samples
444 * are to be converted to max_h_samp_factor * max_v_samp_factor pixels.
445 */
446 h_in_group = (compptr->h_samp_factor * compptr->_DCT_scaled_size) /
447 cinfo->_min_DCT_scaled_size;
448 v_in_group = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
449 cinfo->_min_DCT_scaled_size;
450 h_out_group = cinfo->max_h_samp_factor;
451 v_out_group = cinfo->max_v_samp_factor;
452 upsample->rowgroup_height[ci] = v_in_group; /* save for use later */
453 need_buffer = TRUE;
454 if (! compptr->component_needed) {
455 /* Don't bother to upsample an uninteresting component. */
456 upsample->methods[ci] = noop_upsample;
457 need_buffer = FALSE;
458 } else if (h_in_group == h_out_group && v_in_group == v_out_group) {
459 /* Fullsize components can be processed without any work. */
460 upsample->methods[ci] = fullsize_upsample;
461 need_buffer = FALSE;
462 } else if (h_in_group * 2 == h_out_group &&
463 v_in_group == v_out_group) {
464 /* Special cases for 2h1v upsampling */
465 if (do_fancy && compptr->downsampled_width > 2) {
466 if (jsimd_can_h2v1_fancy_upsample())
467 upsample->methods[ci] = jsimd_h2v1_fancy_upsample;
468 else
469 upsample->methods[ci] = h2v1_fancy_upsample;
470 } else {
471 if (jsimd_can_h2v1_upsample())
472 upsample->methods[ci] = jsimd_h2v1_upsample;
473 else
474 upsample->methods[ci] = h2v1_upsample;
475 }
476 } else if (h_in_group == h_out_group &&
477 v_in_group * 2 == v_out_group && do_fancy) {
478 /* Non-fancy upsampling is handled by the generic method */
479 upsample->methods[ci] = h1v2_fancy_upsample;
480 upsample->pub.need_context_rows = TRUE;
481 } else if (h_in_group * 2 == h_out_group &&
482 v_in_group * 2 == v_out_group) {
483 /* Special cases for 2h2v upsampling */
484 if (do_fancy && compptr->downsampled_width > 2) {
485 if (jsimd_can_h2v2_fancy_upsample())
486 upsample->methods[ci] = jsimd_h2v2_fancy_upsample;
487 else
488 upsample->methods[ci] = h2v2_fancy_upsample;
489 upsample->pub.need_context_rows = TRUE;
490 } else {
491 if (jsimd_can_h2v2_upsample())
492 upsample->methods[ci] = jsimd_h2v2_upsample;
493 else
494 upsample->methods[ci] = h2v2_upsample;
495 }
496 } else if ((h_out_group % h_in_group) == 0 &&
497 (v_out_group % v_in_group) == 0) {
498 /* Generic integral-factors upsampling method */
499 #if defined(__mips__)
500 if (jsimd_can_int_upsample())
501 upsample->methods[ci] = jsimd_int_upsample;
502 else
503 #endif
504 upsample->methods[ci] = int_upsample;
505 upsample->h_expand[ci] = (UINT8) (h_out_group / h_in_group);
506 upsample->v_expand[ci] = (UINT8) (v_out_group / v_in_group);
507 } else
508 ERREXIT(cinfo, JERR_FRACT_SAMPLE_NOTIMPL);
509 if (need_buffer && !cinfo->master->jinit_upsampler_no_alloc) {
510 upsample->color_buf[ci] = (*cinfo->mem->alloc_sarray)
511 ((j_common_ptr) cinfo, JPOOL_IMAGE,
512 (JDIMENSION) jround_up((long) cinfo->output_width,
513 (long) cinfo->max_h_samp_factor),
514 (JDIMENSION) cinfo->max_v_samp_factor);
515 }
516 }
517 }
518