4 * This file was part of the Independent JPEG Group's software:
5 * Copyright (C) 1994-1996, Thomas G. Lane.
6 * libjpeg-turbo Modifications:
7 * Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
8 * Copyright (C) 2009, 2011, 2014-2015, 2020, 2022, D. R. Commander.
9 * Copyright (C) 2013, Linaro Limited.
10 * For conditions of distribution and use, see the accompanying README.ijg
13 * This file contains code for merged upsampling/color conversion.
15 * This file combines functions from jdsample.c and jdcolor.c;
16 * read those files first to understand what's going on.
18 * When the chroma components are to be upsampled by simple replication
19 * (i.e., box filtering), we can save some work in color conversion by
20 * calculating all the output pixels corresponding to a pair of chroma
21 * samples at one time. In the conversion equations
23 * G = Y + K2 * Cb + K3 * Cr
25 * only the Y term varies among the group of pixels corresponding to a pair
26 * of chroma samples, so the rest of the terms can be calculated just once.
27 * At typical sampling ratios, this eliminates half or three-quarters of the
28 * multiplications needed for color conversion.
30 * This file currently provides implementations for the following cases:
31 * YCbCr => RGB color conversion only.
32 * Sampling ratios of 2h1v or 2h2v.
33 * No scaling needed at upsample time.
34 * Corner-aligned (non-CCIR601) sampling alignment.
35 * Other special cases could be added, but in most applications these are
36 * the only common cases. (For uncommon cases we fall back on the more
37 * general code in jdsample.c and jdcolor.c.)
40 #define JPEG_INTERNALS
46 #ifdef UPSAMPLE_MERGING_SUPPORTED
/* Number of fractional bits carried by the fixed-point conversion constants. */
49 #define SCALEBITS 16 /* speediest right-shift on some machines */
/* The value 0.5 at SCALEBITS fractional bits; adding it before a right shift
 * by SCALEBITS turns the shift into a round-to-nearest. */
50 #define ONE_HALF ((JLONG)1 << (SCALEBITS - 1))
/* Convert the constant x to a JLONG scaled by 2^SCALEBITS.  The + 0.5 rounds
 * the scaled value before the truncating cast (exact for non-negative x;
 * negative coefficients in this file are formed by negating FIX(...)). */
51 #define FIX(x) ((JLONG)((x) * (1L << SCALEBITS) + 0.5))
54 /* Include inline routines for colorspace extensions */
/* Each group below binds the generic RGB_* layout macros and the generic
 * h2v1/h2v2 "_internal" function names to one extended pixel format, so that
 * the included template source is compiled under format-specific names.
 * In this extract the #include "jdmrgext.c" line is visible only for the
 * BGRX, XBGR and XRGB groups; presumably the RGB, RGBX and BGR groups include
 * it too, and the RGB_* macros are presumably #undef'd between groups --
 * TODO confirm against the complete file. */

/* EXT_RGB layout -> extrgb_h2v1/h2v2_merged_upsample_internal */
62 #define RGB_RED EXT_RGB_RED
63 #define RGB_GREEN EXT_RGB_GREEN
64 #define RGB_BLUE EXT_RGB_BLUE
65 #define RGB_PIXELSIZE EXT_RGB_PIXELSIZE
66 #define h2v1_merged_upsample_internal extrgb_h2v1_merged_upsample_internal
67 #define h2v2_merged_upsample_internal extrgb_h2v2_merged_upsample_internal
73 #undef h2v1_merged_upsample_internal
74 #undef h2v2_merged_upsample_internal
/* EXT_RGBX layout -> extrgbx_h2v1/h2v2_merged_upsample_internal */
76 #define RGB_RED EXT_RGBX_RED
77 #define RGB_GREEN EXT_RGBX_GREEN
78 #define RGB_BLUE EXT_RGBX_BLUE
80 #define RGB_PIXELSIZE EXT_RGBX_PIXELSIZE
81 #define h2v1_merged_upsample_internal extrgbx_h2v1_merged_upsample_internal
82 #define h2v2_merged_upsample_internal extrgbx_h2v2_merged_upsample_internal
89 #undef h2v1_merged_upsample_internal
90 #undef h2v2_merged_upsample_internal
/* EXT_BGR layout -> extbgr_h2v1/h2v2_merged_upsample_internal */
92 #define RGB_RED EXT_BGR_RED
93 #define RGB_GREEN EXT_BGR_GREEN
94 #define RGB_BLUE EXT_BGR_BLUE
95 #define RGB_PIXELSIZE EXT_BGR_PIXELSIZE
96 #define h2v1_merged_upsample_internal extbgr_h2v1_merged_upsample_internal
97 #define h2v2_merged_upsample_internal extbgr_h2v2_merged_upsample_internal
103 #undef h2v1_merged_upsample_internal
104 #undef h2v2_merged_upsample_internal
/* EXT_BGRX layout -> extbgrx_h2v1/h2v2_merged_upsample_internal */
106 #define RGB_RED EXT_BGRX_RED
107 #define RGB_GREEN EXT_BGRX_GREEN
108 #define RGB_BLUE EXT_BGRX_BLUE
110 #define RGB_PIXELSIZE EXT_BGRX_PIXELSIZE
111 #define h2v1_merged_upsample_internal extbgrx_h2v1_merged_upsample_internal
112 #define h2v2_merged_upsample_internal extbgrx_h2v2_merged_upsample_internal
113 #include "jdmrgext.c"
119 #undef h2v1_merged_upsample_internal
120 #undef h2v2_merged_upsample_internal
/* EXT_XBGR layout -> extxbgr_h2v1/h2v2_merged_upsample_internal */
122 #define RGB_RED EXT_XBGR_RED
123 #define RGB_GREEN EXT_XBGR_GREEN
124 #define RGB_BLUE EXT_XBGR_BLUE
126 #define RGB_PIXELSIZE EXT_XBGR_PIXELSIZE
127 #define h2v1_merged_upsample_internal extxbgr_h2v1_merged_upsample_internal
128 #define h2v2_merged_upsample_internal extxbgr_h2v2_merged_upsample_internal
129 #include "jdmrgext.c"
135 #undef h2v1_merged_upsample_internal
136 #undef h2v2_merged_upsample_internal
/* EXT_XRGB layout -> extxrgb_h2v1/h2v2_merged_upsample_internal */
138 #define RGB_RED EXT_XRGB_RED
139 #define RGB_GREEN EXT_XRGB_GREEN
140 #define RGB_BLUE EXT_XRGB_BLUE
142 #define RGB_PIXELSIZE EXT_XRGB_PIXELSIZE
143 #define h2v1_merged_upsample_internal extxrgb_h2v1_merged_upsample_internal
144 #define h2v2_merged_upsample_internal extxrgb_h2v2_merged_upsample_internal
145 #include "jdmrgext.c"
151 #undef h2v1_merged_upsample_internal
152 #undef h2v2_merged_upsample_internal
156 * Initialize tables for YCC->RGB colorspace conversion.
157 * This is taken directly from jdcolor.c; see that file for more info.
/*
 * Allocate and fill the four chroma lookup tables kept in the merged
 * upsampler state (cinfo->upsample): Cr_r_tab, Cb_b_tab, Cr_g_tab, Cb_g_tab.
 * Each table has _MAXJSAMPLE + 1 entries, one per possible chroma sample
 * value, and is obtained through the alloc_small method of cinfo->mem with
 * pool JPOOL_IMAGE.
 *
 * cinfo: decompression object; cinfo->upsample must already point at the
 *        merged upsampler state, because it is dereferenced immediately.
 * Results are stored through the upsample pointer.  The declarations of the
 * loop variables i and x are not visible in this extract.
 */
161 build_ycc_rgb_table(j_decompress_ptr cinfo)
163 my_merged_upsample_ptr upsample = (my_merged_upsample_ptr)cinfo->upsample;
/* The R and B tables hold plain ints (already shifted down to integers). */
168 upsample->Cr_r_tab = (int *)
169 (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
170 (_MAXJSAMPLE + 1) * sizeof(int));
171 upsample->Cb_b_tab = (int *)
172 (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
173 (_MAXJSAMPLE + 1) * sizeof(int));
/* The two G tables hold JLONG values that stay scaled by 2^SCALEBITS. */
174 upsample->Cr_g_tab = (JLONG *)
175 (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
176 (_MAXJSAMPLE + 1) * sizeof(JLONG));
177 upsample->Cb_g_tab = (JLONG *)
178 (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
179 (_MAXJSAMPLE + 1) * sizeof(JLONG));
/* i is the table index; x is the same sample re-centered around zero. */
181 for (i = 0, x = -_CENTERJSAMPLE; i <= _MAXJSAMPLE; i++, x++) {
182 /* i is the actual input pixel value, in the range 0.._MAXJSAMPLE */
183 /* The Cb or Cr value we are thinking of is x = i - _CENTERJSAMPLE */
184 /* Cr=>R value is nearest int to 1.40200 * x */
185 upsample->Cr_r_tab[i] = (int)
186 RIGHT_SHIFT(FIX(1.40200) * x + ONE_HALF, SCALEBITS);
187 /* Cb=>B value is nearest int to 1.77200 * x */
188 upsample->Cb_b_tab[i] = (int)
189 RIGHT_SHIFT(FIX(1.77200) * x + ONE_HALF, SCALEBITS);
190 /* Cr=>G value is scaled-up -0.71414 * x */
/* No right shift here: the entry keeps its SCALEBITS fractional bits. */
191 upsample->Cr_g_tab[i] = (-FIX(0.71414)) * x;
192 /* Cb=>G value is scaled-up -0.34414 * x */
193 /* We also add in ONE_HALF so that we need not do it in the inner loop */
194 upsample->Cb_g_tab[i] = (-FIX(0.34414)) * x + ONE_HALF;
200 * Initialize for an upsampling pass.
/*
 * Reset the per-pass state of the merged upsampler stored in cinfo->upsample:
 * clear the spare-row flag and reload the remaining-rows counter from
 * cinfo->output_height.
 */
204 start_pass_merged_upsample(j_decompress_ptr cinfo)
206 my_merged_upsample_ptr upsample = (my_merged_upsample_ptr)cinfo->upsample;
208 /* Mark the spare buffer empty */
209 upsample->spare_full = FALSE;
210 /* Initialize total-height counter for detecting bottom of image */
211 upsample->rows_to_go = cinfo->output_height;
216 * Control routine to do upsampling (and color conversion).
218 * The control routine just handles the row buffering considerations.
/*
 * Row-buffering control routine for the 2:1 vertical case.
 *
 * cinfo:               decompression object; state lives in cinfo->upsample.
 * input_buf:           passed through unchanged to the upmethod routine.
 * in_row_group_ctr:    in/out; incremented once the spare row is no longer
 *                      pending.
 * in_row_groups_avail: not referenced by any line visible in this extract.
 * output_buf:          caller's output row array.
 * out_row_ctr:         in/out; index of the next output row, advanced by the
 *                      number of rows delivered.
 * out_rows_avail:      capacity of output_buf in rows.
 *
 * NOTE(review): braces, preprocessor conditionals and some statements of this
 * function are missing from the extract, so the comments below describe only
 * the statements that are visible.
 */
222 merged_2v_upsample(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
223 JDIMENSION *in_row_group_ctr,
224 JDIMENSION in_row_groups_avail, _JSAMPARRAY output_buf,
225 JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail)
226 /* 2:1 vertical sampling case: may need a spare row. */
228 my_merged_upsample_ptr upsample = (my_merged_upsample_ptr)cinfo->upsample;
229 _JSAMPROW work_ptrs[2];
230 JDIMENSION num_rows; /* number of rows returned to caller */
235 if (upsample->spare_full) {
236 /* If we have a spare row saved from a previous cycle, just return it. */
237 JDIMENSION size = upsample->out_row_width;
/* For JCS_RGB565 output the length is output_width * 2, not out_row_width. */
238 if (cinfo->out_color_space == JCS_RGB565)
239 size = cinfo->output_width * 2;
/* NOTE(review): two copy calls are visible, presumably in alternative
 * preprocessor branches.  The first passes out_row_width, not the
 * RGB565-adjusted size computed above -- confirm that branch can never be
 * built with RGB565 output, otherwise it copies more than size samples. */
241 _jcopy_sample_rows(& upsample->spare_row, 0, output_buf + *out_row_ctr, 0,
242 1, upsample->out_row_width);
244 _jcopy_sample_rows(&upsample->spare_row, 0, output_buf + *out_row_ctr, 0,
248 upsample->spare_full = FALSE;
/* Region handling: region_y is rounded down to an even value (for
 * non-negative values the shift pair clears bit 0). */
251 int _region_y = (int)cinfo->region_y;
252 _region_y = (_region_y>>1)<<1;
/* Only when both region_w and region_h are positive: test whether
 * output_scanline falls outside [_region_y, _region_y + region_h).  The
 * action taken for such scanlines is not visible in this extract. */
253 if ((cinfo->region_w > 0) && (cinfo->region_h > 0)) {
254 if (((int)cinfo->output_scanline < _region_y) ||
255 ((int)cinfo->output_scanline >= (_region_y + (int)cinfo->region_h)))
259 /* Figure number of rows to return to caller. */
261 /* Not more than the distance to the end of the image. */
262 if (num_rows > upsample->rows_to_go)
263 num_rows = upsample->rows_to_go;
264 /* And not more than what the client can accept: */
265 out_rows_avail -= *out_row_ctr;
266 if (num_rows > out_rows_avail)
267 num_rows = out_rows_avail;
268 /* Create output pointer array for upsampler. */
269 work_ptrs[0] = output_buf[*out_row_ctr];
/* Second row target: either the caller's next output row, or the spare row
 * (which is then flagged as holding data).  The condition choosing between
 * the two is not visible here -- presumably num_rows > 1; confirm. */
271 work_ptrs[1] = output_buf[*out_row_ctr + 1];
273 work_ptrs[1] = upsample->spare_row;
274 upsample->spare_full = TRUE;
276 /* Now do the upsampling. */
/* The same call appears twice, presumably in alternative branches whose
 * conditions are not visible in this extract. */
279 (*upsample->upmethod) (cinfo, input_buf, *in_row_group_ctr, work_ptrs);
281 (*upsample->upmethod) (cinfo, input_buf, *in_row_group_ctr, work_ptrs);
/* Account for the rows handed to the caller. */
286 *out_row_ctr += num_rows;
287 upsample->rows_to_go -= num_rows;
288 /* When the buffer is emptied, declare this input row group consumed */
289 if (!upsample->spare_full)
290 (*in_row_group_ctr)++;
/*
 * Control routine for the 1:1 vertical case: calls the upmethod routine with
 * the output position output_buf + *out_row_ctr and then advances
 * *in_row_group_ctr by one.
 *
 * in_row_groups_avail and out_rows_avail are not referenced by any visible
 * line.  Any update of *out_row_ctr is not visible in this extract --
 * presumably it is advanced by one row per call; confirm.
 */
295 merged_1v_upsample(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
296 JDIMENSION *in_row_group_ctr,
297 JDIMENSION in_row_groups_avail, _JSAMPARRAY output_buf,
298 JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail)
299 /* 1:1 vertical sampling case: much easier, never need a spare row. */
301 my_merged_upsample_ptr upsample = (my_merged_upsample_ptr)cinfo->upsample;
303 /* Just do the upsampling. */
304 (*upsample->upmethod) (cinfo, input_buf, *in_row_group_ctr,
305 output_buf + *out_row_ctr);
308 (*in_row_group_ctr)++;
313 * These are the routines invoked by the control routines to do
314 * the actual upsampling/conversion. One row group is processed per call.
316 * Note: since we may be writing directly into application-supplied buffers,
317 * we have to be honest about the output width; we can't assume the buffer
318 * has been rounded up to an even width.
323 * Upsample and color convert for the case of 2:1 horizontal and 1:1 vertical.
/*
 * Dispatch on cinfo->out_color_space to one of the format-specific h2v1
 * routines (extrgb, extrgbx, extbgr, extbgrx, extxbgr, extxrgb) or to the
 * generic h2v1_merged_upsample_internal, forwarding cinfo, input_buf and
 * in_row_group_ctr.
 *
 * The case labels and the tail of each call are not visible in this extract;
 * presumably output_buf is the final argument and the generic routine is the
 * default case -- confirm.
 */
327 h2v1_merged_upsample(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
328 JDIMENSION in_row_group_ctr, _JSAMPARRAY output_buf)
330 switch (cinfo->out_color_space) {
332 extrgb_h2v1_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
337 extrgbx_h2v1_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
341 extbgr_h2v1_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
346 extbgrx_h2v1_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
351 extxbgr_h2v1_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
356 extxrgb_h2v1_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
360 h2v1_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
368 * Upsample and color convert for the case of 2:1 horizontal and 2:1 vertical.
/*
 * Dispatch on cinfo->out_color_space to one of the format-specific h2v2
 * routines (extrgb, extrgbx, extbgr, extbgrx, extxbgr, extxrgb) or to the
 * generic h2v2_merged_upsample_internal, forwarding cinfo, input_buf and
 * in_row_group_ctr.
 *
 * The case labels and the tail of each call are not visible in this extract;
 * presumably output_buf is the final argument and the generic routine is the
 * default case -- confirm.
 */
372 h2v2_merged_upsample(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
373 JDIMENSION in_row_group_ctr, _JSAMPARRAY output_buf)
375 switch (cinfo->out_color_space) {
377 extrgb_h2v2_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
382 extrgbx_h2v2_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
386 extbgr_h2v2_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
391 extbgrx_h2v2_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
396 extxbgr_h2v2_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
401 extxrgb_h2v2_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
405 h2v2_merged_upsample_internal(cinfo, input_buf, in_row_group_ctr,
/* Pack r, g, b into a 16-bit 5-6-5 value: bits 3..7 of r land in bits 11..15,
 * bits 2..7 of g in bits 5..10, and b >> 3 in the low bits.  b is not masked,
 * so the layout assumes b fits in 8 bits. */
416 #define PACK_SHORT_565_LE(r, g, b) \
417 ((((r) << 8) & 0xF800) | (((g) << 3) & 0x7E0) | ((b) >> 3))
/* Same fields with the two bytes exchanged: bits 3..7 of r in bits 3..7,
 * bits 5..7 of g in bits 0..2, bits 2..4 of g in bits 13..15, and bits 3..7
 * of b in bits 8..12.  The g >> 5 term is not masked, so g is assumed to fit
 * in 8 bits. */
418 #define PACK_SHORT_565_BE(r, g, b) \
419 (((r) & 0xF8) | ((g) >> 5) | (((g) << 11) & 0xE000) | (((b) << 5) & 0x1F00))
/*
 * Combine two 16-bit pixel values into one word: l is the left pixel and r
 * the right pixel.  The _LE form places r in bits 16 and up and l in the low
 * 16 bits; the _BE form places l in bits 16 and up and r in the low 16 bits.
 *
 * Every parameter is parenthesized so that an argument containing a
 * lower-precedence operator (for example a | b) is shifted or OR-ed as a
 * whole rather than being split by the << in the expansion.
 */
#define PACK_TWO_PIXELS_LE(l, r) (((r) << 16) | (l))
#define PACK_TWO_PIXELS_BE(l, r) (((l) << 16) | (r))
/* Store a packed pixel pair at addr as two INT16 elements: the low 16 bits of
 * pixels go to element 0 and pixels >> 16 to element 1.
 * NOTE(review): addr is accessed through an INT16 pointer, so callers
 * presumably pass addresses suitably aligned for INT16 -- confirm.  The
 * closing brace of the macro body is not visible in this extract. */
424 #define WRITE_TWO_PIXELS_LE(addr, pixels) { \
425 ((INT16 *)(addr))[0] = (INT16)(pixels); \
426 ((INT16 *)(addr))[1] = (INT16)((pixels) >> 16); \
/* Mirror image of the macro above: the low 16 bits of pixels go to element 1
 * and pixels >> 16 to element 0. */
428 #define WRITE_TWO_PIXELS_BE(addr, pixels) { \
429 ((INT16 *)(addr))[1] = (INT16)(pixels); \
430 ((INT16 *)(addr))[0] = (INT16)((pixels) >> 16); \
/* Add a dither offset to one color component before packing.  Only the low
 * 8 bits of dither are used.  Red and blue receive the full offset; green
 * receives half of it -- presumably because green keeps one more bit than
 * red and blue in the 5-6-5 packing (confirm).  The result is not clamped
 * here. */
433 #define DITHER_565_R(r, dither) ((r) + ((dither) & 0xFF))
434 #define DITHER_565_G(g, dither) ((g) + (((dither) & 0xFF) >> 1))
435 #define DITHER_565_B(b, dither) ((b) + ((dither) & 0xFF))
438 /* Declarations for ordered dithering
440 * We use a 4x4 ordered dither array packed into 32 bits. This array is
441 * sufficient for dithering RGB888 to RGB565.
/* Two-bit mask; presumably used to pick one of the four dither_matrix
 * entries -- confirm at the use sites in jdmrg565.c. */
444 #define DITHER_MASK 0x3
/* Rotate a 32-bit value right by 8 bits: the low byte moves to bits 24..31
 * and the remaining 24 bits shift down by 8. */
445 #define DITHER_ROTATE(x) ((((x) & 0xFF) << 24) | (((x) >> 8) & 0x00FFFFFF))
446 static const JLONG dither_matrix[4] = {
454 /* Include inline routines for RGB565 conversion */
/* First instantiation of the jdmrg565.c template: the generic helper macros
 * map to their _LE variants and the four generic routine names map to the
 * *_le function names. */
456 #define PACK_SHORT_565 PACK_SHORT_565_LE
457 #define PACK_TWO_PIXELS PACK_TWO_PIXELS_LE
458 #define WRITE_TWO_PIXELS WRITE_TWO_PIXELS_LE
459 #define h2v1_merged_upsample_565_internal h2v1_merged_upsample_565_le
460 #define h2v1_merged_upsample_565D_internal h2v1_merged_upsample_565D_le
461 #define h2v2_merged_upsample_565_internal h2v2_merged_upsample_565_le
462 #define h2v2_merged_upsample_565D_internal h2v2_merged_upsample_565D_le
463 #include "jdmrg565.c"
/* Drop the _LE bindings so the template can be instantiated again. */
464 #undef PACK_SHORT_565
465 #undef PACK_TWO_PIXELS
466 #undef WRITE_TWO_PIXELS
467 #undef h2v1_merged_upsample_565_internal
468 #undef h2v1_merged_upsample_565D_internal
469 #undef h2v2_merged_upsample_565_internal
470 #undef h2v2_merged_upsample_565D_internal
/* Second instantiation: the same template with the _BE helper macros and the
 * *_be function names. */
472 #define PACK_SHORT_565 PACK_SHORT_565_BE
473 #define PACK_TWO_PIXELS PACK_TWO_PIXELS_BE
474 #define WRITE_TWO_PIXELS WRITE_TWO_PIXELS_BE
475 #define h2v1_merged_upsample_565_internal h2v1_merged_upsample_565_be
476 #define h2v1_merged_upsample_565D_internal h2v1_merged_upsample_565D_be
477 #define h2v2_merged_upsample_565_internal h2v2_merged_upsample_565_be
478 #define h2v2_merged_upsample_565D_internal h2v2_merged_upsample_565D_be
479 #include "jdmrg565.c"
/* Leave no generic bindings defined after the second instantiation. */
480 #undef PACK_SHORT_565
481 #undef PACK_TWO_PIXELS
482 #undef WRITE_TWO_PIXELS
483 #undef h2v1_merged_upsample_565_internal
484 #undef h2v1_merged_upsample_565D_internal
485 #undef h2v2_merged_upsample_565_internal
486 #undef h2v2_merged_upsample_565D_internal
/* Runtime byte-order probe: examines the first byte of test_value.
 * The declaration of test_value and the return statements are not visible in
 * this extract; presumably test_value is an integer set to 1, so a first byte
 * other than 1 means the host is big-endian -- confirm. */
489 static INLINE boolean is_big_endian(void)
492 if (*(char *)&test_value != 1)
/* h2v1 RGB565 entry point without dithering: forwards cinfo, input_buf and
 * in_row_group_ctr to either the _be or the _le instantiation.  The selecting
 * condition and the tail of each call are not visible in this extract --
 * presumably the choice is made with is_big_endian(); confirm. */
499 h2v1_merged_upsample_565(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
500 JDIMENSION in_row_group_ctr, _JSAMPARRAY output_buf)
503 h2v1_merged_upsample_565_be(cinfo, input_buf, in_row_group_ctr,
506 h2v1_merged_upsample_565_le(cinfo, input_buf, in_row_group_ctr,
/* h2v1 RGB565 entry point for the 565D (dithered) routines: forwards cinfo,
 * input_buf and in_row_group_ctr to either the _be or the _le instantiation.
 * The selecting condition and the tail of each call are not visible in this
 * extract -- presumably the choice is made with is_big_endian(); confirm. */
512 h2v1_merged_upsample_565D(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
513 JDIMENSION in_row_group_ctr, _JSAMPARRAY output_buf)
516 h2v1_merged_upsample_565D_be(cinfo, input_buf, in_row_group_ctr,
519 h2v1_merged_upsample_565D_le(cinfo, input_buf, in_row_group_ctr,
/* h2v2 RGB565 entry point without dithering: forwards cinfo, input_buf and
 * in_row_group_ctr to either the _be or the _le instantiation.  The selecting
 * condition and the tail of each call are not visible in this extract --
 * presumably the choice is made with is_big_endian(); confirm. */
525 h2v2_merged_upsample_565(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
526 JDIMENSION in_row_group_ctr, _JSAMPARRAY output_buf)
529 h2v2_merged_upsample_565_be(cinfo, input_buf, in_row_group_ctr,
532 h2v2_merged_upsample_565_le(cinfo, input_buf, in_row_group_ctr,
/* h2v2 RGB565 entry point for the 565D (dithered) routines: forwards cinfo,
 * input_buf and in_row_group_ctr to either the _be or the _le instantiation.
 * The selecting condition and the tail of each call are not visible in this
 * extract -- presumably the choice is made with is_big_endian(); confirm. */
538 h2v2_merged_upsample_565D(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
539 JDIMENSION in_row_group_ctr, _JSAMPARRAY output_buf)
542 h2v2_merged_upsample_565D_be(cinfo, input_buf, in_row_group_ctr,
545 h2v2_merged_upsample_565D_le(cinfo, input_buf, in_row_group_ctr,
551 * Module initialization routine for merged upsampling/color conversion.
553 * NB: this is called under the conditions determined by use_merged_upsample()
554 * in jdmaster.c. That routine MUST correspond to the actual capabilities
555 * of this module; no safety checks are made here.
/*
 * Create and install the merged upsampler object for cinfo.
 *
 * Visible steps: reject a data_precision other than BITS_IN_JSAMPLE via
 * ERREXIT1; allocate the state with alloc_small (JPOOL_IMAGE) and publish it
 * as cinfo->upsample; set start_pass and need_context_rows; compute
 * out_row_width; choose the control routine and the upmethod routine
 * according to max_v_samp_factor, out_color_space and dither_mode; set up the
 * spare row; finally build the YCC->RGB tables.
 *
 * NOTE(review): the braces and the preprocessor/else structure around the
 * jsimd_* and RGB565 selections are not visible in this extract, so the
 * precedence among the upmethod assignments cannot be confirmed from here.
 */
559 _jinit_merged_upsampler(j_decompress_ptr cinfo)
561 my_merged_upsample_ptr upsample;
563 if (cinfo->data_precision != BITS_IN_JSAMPLE)
564 ERREXIT1(cinfo, JERR_BAD_PRECISION, cinfo->data_precision);
566 upsample = (my_merged_upsample_ptr)
567 (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
568 sizeof(my_merged_upsampler));
569 cinfo->upsample = (struct jpeg_upsampler *)upsample;
570 upsample->pub.start_pass = start_pass_merged_upsample;
571 upsample->pub.need_context_rows = FALSE;
/* Samples per output row.  NOTE(review): no overflow check on this product
 * is visible here; presumably the operands are bounded elsewhere -- confirm. */
573 upsample->out_row_width = cinfo->output_width * cinfo->out_color_components;
/* Vertical factor 2: use the row-buffering control routine and the h2v2
 * conversion routines. */
575 if (cinfo->max_v_samp_factor == 2) {
576 upsample->pub._upsample = merged_2v_upsample;
578 if (jsimd_can_h2v2_merged_upsample())
579 upsample->upmethod = jsimd_h2v2_merged_upsample;
582 upsample->upmethod = h2v2_merged_upsample;
/* RGB565 output selects the 565 routines; the 565D routine is chosen when
 * dither_mode is anything other than JDITHER_NONE. */
583 if (cinfo->out_color_space == JCS_RGB565) {
584 if (cinfo->dither_mode != JDITHER_NONE) {
585 upsample->upmethod = h2v2_merged_upsample_565D;
587 upsample->upmethod = h2v2_merged_upsample_565;
590 /* Allocate a spare row buffer */
/* Sized as out_row_width samples, obtained from alloc_large. */
591 upsample->spare_row = (_JSAMPROW)
592 (*cinfo->mem->alloc_large) ((j_common_ptr)cinfo, JPOOL_IMAGE,
593 (size_t)(upsample->out_row_width * sizeof(_JSAMPLE)));
/* Otherwise: the simple control routine and the h2v1 conversion routines. */
595 upsample->pub._upsample = merged_1v_upsample;
597 if (jsimd_can_h2v1_merged_upsample())
598 upsample->upmethod = jsimd_h2v1_merged_upsample;
601 upsample->upmethod = h2v1_merged_upsample;
602 if (cinfo->out_color_space == JCS_RGB565) {
603 if (cinfo->dither_mode != JDITHER_NONE) {
604 upsample->upmethod = h2v1_merged_upsample_565D;
606 upsample->upmethod = h2v1_merged_upsample_565;
609 /* No spare row needed */
610 upsample->spare_row = NULL;
/* Fill the chroma lookup tables kept in the upsampler state. */
613 build_ycc_rgb_table(cinfo);
616 #endif /* UPSAMPLE_MERGING_SUPPORTED */