nuclear@14: /*
nuclear@14:  * jdmerge.c
nuclear@14:  *
nuclear@14:  * Copyright (C) 1994-1996, Thomas G. Lane.
nuclear@14:  * This file is part of the Independent JPEG Group's software.
nuclear@14:  * For conditions of distribution and use, see the accompanying README file.
nuclear@14:  *
nuclear@14:  * This file contains code for merged upsampling/color conversion.
nuclear@14:  *
nuclear@14:  * This file combines functions from jdsample.c and jdcolor.c;
nuclear@14:  * read those files first to understand what's going on.
nuclear@14:  *
nuclear@14:  * When the chroma components are to be upsampled by simple replication
nuclear@14:  * (ie, box filtering), we can save some work in color conversion by
nuclear@14:  * calculating all the output pixels corresponding to a pair of chroma
nuclear@14:  * samples at one time.  In the conversion equations
nuclear@14:  *	R = Y           + K1 * Cr
nuclear@14:  *	G = Y + K2 * Cb + K3 * Cr
nuclear@14:  *	B = Y + K4 * Cb
nuclear@14:  * only the Y term varies among the group of pixels corresponding to a pair
nuclear@14:  * of chroma samples, so the rest of the terms can be calculated just once.
nuclear@14:  * At typical sampling ratios, this eliminates half or three-quarters of the
nuclear@14:  * multiplications needed for color conversion.
nuclear@14:  *
nuclear@14:  * This file currently provides implementations for the following cases:
nuclear@14:  *	YCbCr => RGB color conversion only.
nuclear@14:  *	Sampling ratios of 2h1v or 2h2v.
nuclear@14:  *	No scaling needed at upsample time.
nuclear@14:  *	Corner-aligned (non-CCIR601) sampling alignment.
nuclear@14:  * Other special cases could be added, but in most applications these are
nuclear@14:  * the only common cases.  (For uncommon cases we fall back on the more
nuclear@14:  * general code in jdsample.c and jdcolor.c.)
nuclear@14:  */
nuclear@14: 
nuclear@14: #define JPEG_INTERNALS
nuclear@14: #include "jinclude.h"
nuclear@14: #include "jpeglib.h"
nuclear@14: 
nuclear@14: #ifdef UPSAMPLE_MERGING_SUPPORTED
nuclear@14: 
nuclear@14: 
nuclear@14: /* Private subobject */
nuclear@14: 
nuclear@14: typedef struct {
nuclear@14:   struct jpeg_upsampler pub;	/* public fields */
nuclear@14: 
nuclear@14:   /* Pointer to routine to do actual upsampling/conversion of one row group */
nuclear@14:   JMETHOD(void, upmethod, (j_decompress_ptr cinfo,
nuclear@14: 			   JSAMPIMAGE input_buf, JDIMENSION in_row_group_ctr,
nuclear@14: 			   JSAMPARRAY output_buf));
nuclear@14: 
nuclear@14:   /* Private state for YCC->RGB conversion */
nuclear@14:   int * Cr_r_tab;		/* => table for Cr to R conversion */
nuclear@14:   int * Cb_b_tab;		/* => table for Cb to B conversion */
nuclear@14:   INT32 * Cr_g_tab;		/* => table for Cr to G conversion */
nuclear@14:   INT32 * Cb_g_tab;		/* => table for Cb to G conversion */
nuclear@14: 
nuclear@14:   /* For 2:1 vertical sampling, we produce two output rows at a time.
nuclear@14:    * We need a "spare" row buffer to hold the second output row if the
nuclear@14:    * application provides just a one-row buffer; we also use the spare
nuclear@14:    * to discard the dummy last row if the image height is odd.
nuclear@14:    */
nuclear@14:   JSAMPROW spare_row;
nuclear@14:   boolean spare_full;		/* T if spare buffer is occupied */
nuclear@14: 
nuclear@14:   JDIMENSION out_row_width;	/* samples per output row */
nuclear@14:   JDIMENSION rows_to_go;	/* counts rows remaining in image */
nuclear@14: } my_upsampler;
nuclear@14: 
nuclear@14: typedef my_upsampler * my_upsample_ptr;
nuclear@14: 
nuclear@14: #define SCALEBITS	16	/* speediest right-shift on some machines */
nuclear@14: #define ONE_HALF	((INT32) 1 << (SCALEBITS-1))
nuclear@14: #define FIX(x)		((INT32) ((x) * (1L<<SCALEBITS) + 0.5))
nuclear@14: 
nuclear@14: 
nuclear@14: /*
nuclear@14:  * Initialize tables for YCC->RGB colorspace conversion.
nuclear@14:  * This is taken directly from jdcolor.c; see that file for more info.
nuclear@14:  */
nuclear@14: 
nuclear@14: LOCAL(void)
nuclear@14: build_ycc_rgb_table (j_decompress_ptr cinfo)
nuclear@14: {
nuclear@14:   my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
nuclear@14:   int i;
nuclear@14:   INT32 x;
nuclear@14:   SHIFT_TEMPS
nuclear@14: 
nuclear@14:   upsample->Cr_r_tab = (int *)
nuclear@14:     (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
nuclear@14: 				(MAXJSAMPLE+1) * SIZEOF(int));
nuclear@14:   upsample->Cb_b_tab = (int *)
nuclear@14:     (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
nuclear@14: 				(MAXJSAMPLE+1) * SIZEOF(int));
nuclear@14:   upsample->Cr_g_tab = (INT32 *)
nuclear@14:     (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
nuclear@14: 				(MAXJSAMPLE+1) * SIZEOF(INT32));
nuclear@14:   upsample->Cb_g_tab = (INT32 *)
nuclear@14:     (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
nuclear@14: 				(MAXJSAMPLE+1) * SIZEOF(INT32));
nuclear@14: 
nuclear@14:   for (i = 0, x = -CENTERJSAMPLE; i <= MAXJSAMPLE; i++, x++) {
nuclear@14:     /* i is the actual input pixel value, in the range 0..MAXJSAMPLE */
nuclear@14:     /* The Cb or Cr value we are thinking of is x = i - CENTERJSAMPLE */
nuclear@14:     /* Cr=>R value is nearest int to 1.40200 * x */
nuclear@14:     upsample->Cr_r_tab[i] = (int)
nuclear@14: 		    RIGHT_SHIFT(FIX(1.40200) * x + ONE_HALF, SCALEBITS);
nuclear@14:     /* Cb=>B value is nearest int to 1.77200 * x */
nuclear@14:     upsample->Cb_b_tab[i] = (int)
nuclear@14: 		    RIGHT_SHIFT(FIX(1.77200) * x + ONE_HALF, SCALEBITS);
nuclear@14:     /* Cr=>G value is scaled-up -0.71414 * x */
nuclear@14:     upsample->Cr_g_tab[i] = (- FIX(0.71414)) * x;
nuclear@14:     /* Cb=>G value is scaled-up -0.34414 * x */
nuclear@14:     /* We also add in ONE_HALF so that need not do it in inner loop */
nuclear@14:     upsample->Cb_g_tab[i] = (- FIX(0.34414)) * x + ONE_HALF;
nuclear@14:   }
nuclear@14: }
nuclear@14: 
nuclear@14: 
nuclear@14: /*
nuclear@14:  * Initialize for an upsampling pass.
nuclear@14:  */
nuclear@14: 
nuclear@14: METHODDEF(void)
nuclear@14: start_pass_merged_upsample (j_decompress_ptr cinfo)
nuclear@14: {
nuclear@14:   my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
nuclear@14: 
nuclear@14:   /* Mark the spare buffer empty */
nuclear@14:   upsample->spare_full = FALSE;
nuclear@14:   /* Initialize total-height counter for detecting bottom of image */
nuclear@14:   upsample->rows_to_go = cinfo->output_height;
nuclear@14: }
nuclear@14: 
nuclear@14: 
nuclear@14: /*
nuclear@14:  * Control routine to do upsampling (and color conversion).
nuclear@14:  *
nuclear@14:  * The control routine just handles the row buffering considerations.
nuclear@14:  */
nuclear@14: 
nuclear@14: METHODDEF(void)
nuclear@14: merged_2v_upsample (j_decompress_ptr cinfo,
nuclear@14: 		    JSAMPIMAGE input_buf, JDIMENSION *in_row_group_ctr,
nuclear@14: 		    JDIMENSION in_row_groups_avail,
nuclear@14: 		    JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
nuclear@14: 		    JDIMENSION out_rows_avail)
nuclear@14: /* 2:1 vertical sampling case: may need a spare row. */
nuclear@14: {
nuclear@14:   my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
nuclear@14:   JSAMPROW work_ptrs[2];
nuclear@14:   JDIMENSION num_rows;		/* number of rows returned to caller */
nuclear@14: 
nuclear@14:   if (upsample->spare_full) {
nuclear@14:     /* If we have a spare row saved from a previous cycle, just return it. */
nuclear@14:     jcopy_sample_rows(& upsample->spare_row, 0, output_buf + *out_row_ctr, 0,
nuclear@14: 		      1, upsample->out_row_width);
nuclear@14:     num_rows = 1;
nuclear@14:     upsample->spare_full = FALSE;
nuclear@14:   } else {
nuclear@14:     /* Figure number of rows to return to caller. */
nuclear@14:     num_rows = 2;
nuclear@14:     /* Not more than the distance to the end of the image. */
nuclear@14:     if (num_rows > upsample->rows_to_go)
nuclear@14:       num_rows = upsample->rows_to_go;
nuclear@14:     /* And not more than what the client can accept: */
nuclear@14:     out_rows_avail -= *out_row_ctr;
nuclear@14:     if (num_rows > out_rows_avail)
nuclear@14:       num_rows = out_rows_avail;
nuclear@14:     /* Create output pointer array for upsampler. */
nuclear@14:     work_ptrs[0] = output_buf[*out_row_ctr];
nuclear@14:     if (num_rows > 1) {
nuclear@14:       work_ptrs[1] = output_buf[*out_row_ctr + 1];
nuclear@14:     } else {
nuclear@14:       work_ptrs[1] = upsample->spare_row;
nuclear@14:       upsample->spare_full = TRUE;
nuclear@14:     }
nuclear@14:     /* Now do the upsampling. */
nuclear@14:     (*upsample->upmethod) (cinfo, input_buf, *in_row_group_ctr, work_ptrs);
nuclear@14:   }
nuclear@14: 
nuclear@14:   /* Adjust counts */
nuclear@14:   *out_row_ctr += num_rows;
nuclear@14:   upsample->rows_to_go -= num_rows;
nuclear@14:   /* When the buffer is emptied, declare this input row group consumed */
nuclear@14:   if (! upsample->spare_full)
nuclear@14:     (*in_row_group_ctr)++;
nuclear@14: }
nuclear@14: 
nuclear@14: 
nuclear@14: METHODDEF(void)
nuclear@14: merged_1v_upsample (j_decompress_ptr cinfo,
nuclear@14: 		    JSAMPIMAGE input_buf, JDIMENSION *in_row_group_ctr,
nuclear@14: 		    JDIMENSION in_row_groups_avail,
nuclear@14: 		    JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
nuclear@14: 		    JDIMENSION out_rows_avail)
nuclear@14: /* 1:1 vertical sampling case: much easier, never need a spare row. */
nuclear@14: {
nuclear@14:   my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
nuclear@14: 
nuclear@14:   /* Just do the upsampling. */
nuclear@14:   (*upsample->upmethod) (cinfo, input_buf, *in_row_group_ctr,
nuclear@14: 			 output_buf + *out_row_ctr);
nuclear@14:   /* Adjust counts */
nuclear@14:   (*out_row_ctr)++;
nuclear@14:   (*in_row_group_ctr)++;
nuclear@14: }
nuclear@14: 
nuclear@14: 
nuclear@14: /*
nuclear@14:  * These are the routines invoked by the control routines to do
nuclear@14:  * the actual upsampling/conversion.  One row group is processed per call.
nuclear@14:  *
nuclear@14:  * Note: since we may be writing directly into application-supplied buffers,
nuclear@14:  * we have to be honest about the output width; we can't assume the buffer
nuclear@14:  * has been rounded up to an even width.
nuclear@14:  */
nuclear@14: 
nuclear@14: 
nuclear@14: /*
nuclear@14:  * Upsample and color convert for the case of 2:1 horizontal and 1:1 vertical.
nuclear@14:  */
nuclear@14: 
nuclear@14: METHODDEF(void)
nuclear@14: h2v1_merged_upsample (j_decompress_ptr cinfo,
nuclear@14: 		      JSAMPIMAGE input_buf, JDIMENSION in_row_group_ctr,
nuclear@14: 		      JSAMPARRAY output_buf)
nuclear@14: {
nuclear@14:   my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
nuclear@14:   register int y, cred, cgreen, cblue;
nuclear@14:   int cb, cr;
nuclear@14:   register JSAMPROW outptr;
nuclear@14:   JSAMPROW inptr0, inptr1, inptr2;
nuclear@14:   JDIMENSION col;
nuclear@14:   /* copy these pointers into registers if possible */
nuclear@14:   register JSAMPLE * range_limit = cinfo->sample_range_limit;
nuclear@14:   int * Crrtab = upsample->Cr_r_tab;
nuclear@14:   int * Cbbtab = upsample->Cb_b_tab;
nuclear@14:   INT32 * Crgtab = upsample->Cr_g_tab;
nuclear@14:   INT32 * Cbgtab = upsample->Cb_g_tab;
nuclear@14:   SHIFT_TEMPS
nuclear@14: 
nuclear@14:   inptr0 = input_buf[0][in_row_group_ctr];
nuclear@14:   inptr1 = input_buf[1][in_row_group_ctr];
nuclear@14:   inptr2 = input_buf[2][in_row_group_ctr];
nuclear@14:   outptr = output_buf[0];
nuclear@14:   /* Loop for each pair of output pixels */
nuclear@14:   for (col = cinfo->output_width >> 1; col > 0; col--) {
nuclear@14:     /* Do the chroma part of the calculation */
nuclear@14:     cb = GETJSAMPLE(*inptr1++);
nuclear@14:     cr = GETJSAMPLE(*inptr2++);
nuclear@14:     cred = Crrtab[cr];
nuclear@14:     cgreen = (int) RIGHT_SHIFT(Cbgtab[cb] + Crgtab[cr], SCALEBITS);
nuclear@14:     cblue = Cbbtab[cb];
nuclear@14:     /* Fetch 2 Y values and emit 2 pixels */
nuclear@14:     y  = GETJSAMPLE(*inptr0++);
nuclear@14:     outptr[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:     outptr += RGB_PIXELSIZE;
nuclear@14:     y  = GETJSAMPLE(*inptr0++);
nuclear@14:     outptr[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:     outptr += RGB_PIXELSIZE;
nuclear@14:   }
nuclear@14:   /* If image width is odd, do the last output column separately */
nuclear@14:   if (cinfo->output_width & 1) {
nuclear@14:     cb = GETJSAMPLE(*inptr1);
nuclear@14:     cr = GETJSAMPLE(*inptr2);
nuclear@14:     cred = Crrtab[cr];
nuclear@14:     cgreen = (int) RIGHT_SHIFT(Cbgtab[cb] + Crgtab[cr], SCALEBITS);
nuclear@14:     cblue = Cbbtab[cb];
nuclear@14:     y  = GETJSAMPLE(*inptr0);
nuclear@14:     outptr[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:   }
nuclear@14: }
nuclear@14: 
nuclear@14: 
nuclear@14: /*
nuclear@14:  * Upsample and color convert for the case of 2:1 horizontal and 2:1 vertical.
nuclear@14:  */
nuclear@14: 
nuclear@14: METHODDEF(void)
nuclear@14: h2v2_merged_upsample (j_decompress_ptr cinfo,
nuclear@14: 		      JSAMPIMAGE input_buf, JDIMENSION in_row_group_ctr,
nuclear@14: 		      JSAMPARRAY output_buf)
nuclear@14: {
nuclear@14:   my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample;
nuclear@14:   register int y, cred, cgreen, cblue;
nuclear@14:   int cb, cr;
nuclear@14:   register JSAMPROW outptr0, outptr1;
nuclear@14:   JSAMPROW inptr00, inptr01, inptr1, inptr2;
nuclear@14:   JDIMENSION col;
nuclear@14:   /* copy these pointers into registers if possible */
nuclear@14:   register JSAMPLE * range_limit = cinfo->sample_range_limit;
nuclear@14:   int * Crrtab = upsample->Cr_r_tab;
nuclear@14:   int * Cbbtab = upsample->Cb_b_tab;
nuclear@14:   INT32 * Crgtab = upsample->Cr_g_tab;
nuclear@14:   INT32 * Cbgtab = upsample->Cb_g_tab;
nuclear@14:   SHIFT_TEMPS
nuclear@14: 
nuclear@14:   inptr00 = input_buf[0][in_row_group_ctr*2];
nuclear@14:   inptr01 = input_buf[0][in_row_group_ctr*2 + 1];
nuclear@14:   inptr1 = input_buf[1][in_row_group_ctr];
nuclear@14:   inptr2 = input_buf[2][in_row_group_ctr];
nuclear@14:   outptr0 = output_buf[0];
nuclear@14:   outptr1 = output_buf[1];
nuclear@14:   /* Loop for each group of output pixels */
nuclear@14:   for (col = cinfo->output_width >> 1; col > 0; col--) {
nuclear@14:     /* Do the chroma part of the calculation */
nuclear@14:     cb = GETJSAMPLE(*inptr1++);
nuclear@14:     cr = GETJSAMPLE(*inptr2++);
nuclear@14:     cred = Crrtab[cr];
nuclear@14:     cgreen = (int) RIGHT_SHIFT(Cbgtab[cb] + Crgtab[cr], SCALEBITS);
nuclear@14:     cblue = Cbbtab[cb];
nuclear@14:     /* Fetch 4 Y values and emit 4 pixels */
nuclear@14:     y  = GETJSAMPLE(*inptr00++);
nuclear@14:     outptr0[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr0[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr0[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:     outptr0 += RGB_PIXELSIZE;
nuclear@14:     y  = GETJSAMPLE(*inptr00++);
nuclear@14:     outptr0[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr0[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr0[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:     outptr0 += RGB_PIXELSIZE;
nuclear@14:     y  = GETJSAMPLE(*inptr01++);
nuclear@14:     outptr1[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr1[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr1[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:     outptr1 += RGB_PIXELSIZE;
nuclear@14:     y  = GETJSAMPLE(*inptr01++);
nuclear@14:     outptr1[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr1[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr1[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:     outptr1 += RGB_PIXELSIZE;
nuclear@14:   }
nuclear@14:   /* If image width is odd, do the last output column separately */
nuclear@14:   if (cinfo->output_width & 1) {
nuclear@14:     cb = GETJSAMPLE(*inptr1);
nuclear@14:     cr = GETJSAMPLE(*inptr2);
nuclear@14:     cred = Crrtab[cr];
nuclear@14:     cgreen = (int) RIGHT_SHIFT(Cbgtab[cb] + Crgtab[cr], SCALEBITS);
nuclear@14:     cblue = Cbbtab[cb];
nuclear@14:     y  = GETJSAMPLE(*inptr00);
nuclear@14:     outptr0[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr0[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr0[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:     y  = GETJSAMPLE(*inptr01);
nuclear@14:     outptr1[RGB_RED] =   range_limit[y + cred];
nuclear@14:     outptr1[RGB_GREEN] = range_limit[y + cgreen];
nuclear@14:     outptr1[RGB_BLUE] =  range_limit[y + cblue];
nuclear@14:   }
nuclear@14: }
nuclear@14: 
nuclear@14: 
nuclear@14: /*
nuclear@14:  * Module initialization routine for merged upsampling/color conversion.
nuclear@14:  *
nuclear@14:  * NB: this is called under the conditions determined by use_merged_upsample()
nuclear@14:  * in jdmaster.c.  That routine MUST correspond to the actual capabilities
nuclear@14:  * of this module; no safety checks are made here.
nuclear@14:  */
nuclear@14: 
nuclear@14: GLOBAL(void)
nuclear@14: jinit_merged_upsampler (j_decompress_ptr cinfo)
nuclear@14: {
nuclear@14:   my_upsample_ptr upsample;
nuclear@14: 
nuclear@14:   upsample = (my_upsample_ptr)
nuclear@14:     (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
nuclear@14: 				SIZEOF(my_upsampler));
nuclear@14:   cinfo->upsample = (struct jpeg_upsampler *) upsample;
nuclear@14:   upsample->pub.start_pass = start_pass_merged_upsample;
nuclear@14:   upsample->pub.need_context_rows = FALSE;
nuclear@14: 
nuclear@14:   upsample->out_row_width = cinfo->output_width * cinfo->out_color_components;
nuclear@14: 
nuclear@14:   if (cinfo->max_v_samp_factor == 2) {
nuclear@14:     upsample->pub.upsample = merged_2v_upsample;
nuclear@14:     upsample->upmethod = h2v2_merged_upsample;
nuclear@14:     /* Allocate a spare row buffer */
nuclear@14:     upsample->spare_row = (JSAMPROW)
nuclear@14:       (*cinfo->mem->alloc_large) ((j_common_ptr) cinfo, JPOOL_IMAGE,
nuclear@14: 		(size_t) (upsample->out_row_width * SIZEOF(JSAMPLE)));
nuclear@14:   } else {
nuclear@14:     upsample->pub.upsample = merged_1v_upsample;
nuclear@14:     upsample->upmethod = h2v1_merged_upsample;
nuclear@14:     /* No spare row needed */
nuclear@14:     upsample->spare_row = NULL;
nuclear@14:   }
nuclear@14: 
nuclear@14:   build_ycc_rgb_table(cinfo);
nuclear@14: }
nuclear@14: 
nuclear@14: #endif /* UPSAMPLE_MERGING_SUPPORTED */