third_party/libjpeg_turbo/jidctred.c - Issue 4134011: Adds libjpeg-turbo to deps...

Side by Side Diff: third_party/libjpeg_turbo/jidctred.c

Issue 4134011: Adds libjpeg-turbo to deps... (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/deps/

Patch Set: Created 10 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

OLD	NEW
(Empty)
	1 /*

	2 * jidctred.c

	3 *

	4 * Copyright (C) 1994-1998, Thomas G. Lane.

	5 * This file is part of the Independent JPEG Group's software.

	6 * For conditions of distribution and use, see the accompanying README file.

	7 *

	8 * This file contains inverse-DCT routines that produce reduced-size output:

	9 * either 4x4, 2x2, or 1x1 pixels from an 8x8 DCT block.

	10 *

	11 * The implementation is based on the Loeffler, Ligtenberg and Moschytz (LL&M)

	12 * algorithm used in jidctint.c. We simply replace each 8-to-8 1-D IDCT step

	13 * with an 8-to-4 step that produces the four averages of two adjacent outputs

	14 * (or an 8-to-2 step producing two averages of four outputs, for 2x2 output).

	15 * These steps were derived by computing the corresponding values at the end

	16 * of the normal LL&M code, then simplifying as much as possible.

	17 *

	18 * 1x1 is trivial: just take the DC coefficient divided by 8.

	19 *

	20 * See jidctint.c for additional comments.

	21 */

	22

	23 #define JPEG_INTERNALS

	24 #include "jinclude.h"

	25 #include "jpeglib.h"

	26 #include "jdct.h" /* Private declarations for DCT subsystem */

	27

	28 #ifdef IDCT_SCALING_SUPPORTED

	29

	30

	31 /*

	32 * This module is specialized to the case DCTSIZE = 8.

	33 */

	34

	35 #if DCTSIZE != 8

	36 Sorry, this code only copes with 8x8 DCTs. /* deliberate syntax err */

	37 #endif

	38

	39

	40 /* Scaling is the same as in jidctint.c. */

	41

	42 #if BITS_IN_JSAMPLE == 8

	43 #define CONST_BITS 13

	44 #define PASS1_BITS 2

	45 #else

	46 #define CONST_BITS 13

	47 #define PASS1_BITS 1 /* lose a little precision to avoid overflow */

	48 #endif

	49

	50 /* Some C compilers fail to reduce "FIX(constant)" at compile time, thus

	51 * causing a lot of useless floating-point operations at run time.

	52 * To get around this we use the following pre-calculated constants.

	53 * If you change CONST_BITS you may want to add appropriate values.

	54 * (With a reasonable C compiler, you can just rely on the FIX() macro...)

	55 */

	56

	57 #if CONST_BITS == 13

	58 #define FIX_0_211164243 ((INT32) 1730) /* FIX(0.211164243) */

	59 #define FIX_0_509795579 ((INT32) 4176) /* FIX(0.509795579) */

	60 #define FIX_0_601344887 ((INT32) 4926) /* FIX(0.601344887) */

	61 #define FIX_0_720959822 ((INT32) 5906) /* FIX(0.720959822) */

	62 #define FIX_0_765366865 ((INT32) 6270) /* FIX(0.765366865) */

	63 #define FIX_0_850430095 ((INT32) 6967) /* FIX(0.850430095) */

	64 #define FIX_0_899976223 ((INT32) 7373) /* FIX(0.899976223) */

	65 #define FIX_1_061594337 ((INT32) 8697) /* FIX(1.061594337) */

	66 #define FIX_1_272758580 ((INT32) 10426) /* FIX(1.272758580) */

	67 #define FIX_1_451774981 ((INT32) 11893) /* FIX(1.451774981) */

	68 #define FIX_1_847759065 ((INT32) 15137) /* FIX(1.847759065) */

	69 #define FIX_2_172734803 ((INT32) 17799) /* FIX(2.172734803) */

	70 #define FIX_2_562915447 ((INT32) 20995) /* FIX(2.562915447) */

	71 #define FIX_3_624509785 ((INT32) 29692) /* FIX(3.624509785) */

	72 #else

	73 #define FIX_0_211164243 FIX(0.211164243)

	74 #define FIX_0_509795579 FIX(0.509795579)

	75 #define FIX_0_601344887 FIX(0.601344887)

	76 #define FIX_0_720959822 FIX(0.720959822)

	77 #define FIX_0_765366865 FIX(0.765366865)

	78 #define FIX_0_850430095 FIX(0.850430095)

	79 #define FIX_0_899976223 FIX(0.899976223)

	80 #define FIX_1_061594337 FIX(1.061594337)

	81 #define FIX_1_272758580 FIX(1.272758580)

	82 #define FIX_1_451774981 FIX(1.451774981)

	83 #define FIX_1_847759065 FIX(1.847759065)

	84 #define FIX_2_172734803 FIX(2.172734803)

	85 #define FIX_2_562915447 FIX(2.562915447)

	86 #define FIX_3_624509785 FIX(3.624509785)

	87 #endif

	88

	89

	90 /* Multiply an INT32 variable by an INT32 constant to yield an INT32 result.

	91 * For 8-bit samples with the recommended scaling, all the variable

	92 * and constant values involved are no more than 16 bits wide, so a

	93 * 16x16->32 bit multiply can be used instead of a full 32x32 multiply.

	94 * For 12-bit samples, a full 32-bit multiplication will be needed.

	95 */

	96

	97 #if BITS_IN_JSAMPLE == 8

	98 #define MULTIPLY(var,const) MULTIPLY16C16(var,const)

	99 #else

	100 #define MULTIPLY(var,const) ((var) * (const))

	101 #endif

	102

	103

	104 /* Dequantize a coefficient by multiplying it by the multiplier-table

	105 * entry; produce an int result. In this module, both inputs and result

	106 * are 16 bits or less, so either int or short multiply will work.

	107 */

	108

	109 #define DEQUANTIZE(coef,quantval) (((ISLOW_MULT_TYPE) (coef)) * (quantval))

	110

	111

	112 /*

	113 * Perform dequantization and inverse DCT on one block of coefficients,

	114 * producing a reduced-size 4x4 output block.

	115 */

	116

	117 GLOBAL(void)

	118 jpeg_idct_4x4 (j_decompress_ptr cinfo, jpeg_component_info * compptr,

	119 JCOEFPTR coef_block,

	120 JSAMPARRAY output_buf, JDIMENSION output_col)

	121 {

	122 INT32 tmp0, tmp2, tmp10, tmp12;

	123 INT32 z1, z2, z3, z4;

	124 JCOEFPTR inptr;

	125 ISLOW_MULT_TYPE * quantptr;

	126 int * wsptr;

	127 JSAMPROW outptr;

	128 JSAMPLE *range_limit = IDCT_range_limit(cinfo);

	129 int ctr;

	130 int workspace[DCTSIZE*4]; /* buffers data between passes */

	131 SHIFT_TEMPS

	132

	133 /* Pass 1: process columns from input, store into work array. */

	134

	135 inptr = coef_block;

	136 quantptr = (ISLOW_MULT_TYPE *) compptr->dct_table;

	137 wsptr = workspace;

	138 for (ctr = DCTSIZE; ctr > 0; inptr++, quantptr++, wsptr++, ctr--) {

	139 /* Don't bother to process column 4, because second pass won't use it */

	140 if (ctr == DCTSIZE-4)

	141 continue;

	142 if (inptr[DCTSIZE*1] == 0 && inptr[DCTSIZE*2] == 0 &&

	143 inptr[DCTSIZE*3] == 0 && inptr[DCTSIZE*5] == 0 &&

	144 inptr[DCTSIZE*6] == 0 && inptr[DCTSIZE*7] == 0) {

	145 /* AC terms all zero; we need not examine term 4 for 4x4 output */

	146 int dcval = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]) << PASS1_BITS;

	147

	148 wsptr[DCTSIZE*0] = dcval;

	149 wsptr[DCTSIZE*1] = dcval;

	150 wsptr[DCTSIZE*2] = dcval;

	151 wsptr[DCTSIZE*3] = dcval;

	152

	153 continue;

	154 }

	155

	156 /* Even part */

	157

	158 tmp0 = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]);

	159 tmp0 <<= (CONST_BITS+1);

	160

	161 z2 = DEQUANTIZE(inptr[DCTSIZE*2], quantptr[DCTSIZE*2]);

	162 z3 = DEQUANTIZE(inptr[DCTSIZE*6], quantptr[DCTSIZE*6]);

	163

	164 tmp2 = MULTIPLY(z2, FIX_1_847759065) + MULTIPLY(z3, - FIX_0_765366865);

	165

	166 tmp10 = tmp0 + tmp2;

	167 tmp12 = tmp0 - tmp2;

	168

	169 /* Odd part */

	170

	171 z1 = DEQUANTIZE(inptr[DCTSIZE*7], quantptr[DCTSIZE*7]);

	172 z2 = DEQUANTIZE(inptr[DCTSIZE*5], quantptr[DCTSIZE*5]);

	173 z3 = DEQUANTIZE(inptr[DCTSIZE*3], quantptr[DCTSIZE*3]);

	174 z4 = DEQUANTIZE(inptr[DCTSIZE*1], quantptr[DCTSIZE*1]);

	175

	176 tmp0 = MULTIPLY(z1, - FIX_0_211164243) /* sqrt(2) * (c3-c1) */

	177 + MULTIPLY(z2, FIX_1_451774981) /* sqrt(2) * (c3+c7) */

	178 + MULTIPLY(z3, - FIX_2_172734803) /* sqrt(2) * (-c1-c5) */

	179 + MULTIPLY(z4, FIX_1_061594337); /* sqrt(2) * (c5+c7) */

	180

	181 tmp2 = MULTIPLY(z1, - FIX_0_509795579) /* sqrt(2) * (c7-c5) */

	182 + MULTIPLY(z2, - FIX_0_601344887) /* sqrt(2) * (c5-c1) */

	183 + MULTIPLY(z3, FIX_0_899976223) /* sqrt(2) * (c3-c7) */

	184 + MULTIPLY(z4, FIX_2_562915447); /* sqrt(2) * (c1+c3) */

	185

	186 /* Final output stage */

	187

	188 wsptr[DCTSIZE*0] = (int) DESCALE(tmp10 + tmp2, CONST_BITS-PASS1_BITS+1);

	189 wsptr[DCTSIZE*3] = (int) DESCALE(tmp10 - tmp2, CONST_BITS-PASS1_BITS+1);

	190 wsptr[DCTSIZE*1] = (int) DESCALE(tmp12 + tmp0, CONST_BITS-PASS1_BITS+1);

	191 wsptr[DCTSIZE*2] = (int) DESCALE(tmp12 - tmp0, CONST_BITS-PASS1_BITS+1);

	192 }

	193

	194 /* Pass 2: process 4 rows from work array, store into output array. */

	195

	196 wsptr = workspace;

	197 for (ctr = 0; ctr < 4; ctr++) {

	198 outptr = output_buf[ctr] + output_col;

	199 /* It's not clear whether a zero row test is worthwhile here ... */

	200

	201 #ifndef NO_ZERO_ROW_TEST

	202 if (wsptr[1] == 0 && wsptr[2] == 0 && wsptr[3] == 0 &&

	203 wsptr[5] == 0 && wsptr[6] == 0 && wsptr[7] == 0) {

	204 /* AC terms all zero */

	205 JSAMPLE dcval = range_limit[(int) DESCALE((INT32) wsptr[0], PASS1_BITS+3)

	206 & RANGE_MASK];

	207

	208 outptr[0] = dcval;

	209 outptr[1] = dcval;

	210 outptr[2] = dcval;

	211 outptr[3] = dcval;

	212

	213 wsptr += DCTSIZE; /* advance pointer to next row */

	214 continue;

	215 }

	216 #endif

	217

	218 /* Even part */

	219

	220 tmp0 = ((INT32) wsptr[0]) << (CONST_BITS+1);

	221

	222 tmp2 = MULTIPLY((INT32) wsptr[2], FIX_1_847759065)

	223 + MULTIPLY((INT32) wsptr[6], - FIX_0_765366865);

	224

	225 tmp10 = tmp0 + tmp2;

	226 tmp12 = tmp0 - tmp2;

	227

	228 /* Odd part */

	229

	230 z1 = (INT32) wsptr[7];

	231 z2 = (INT32) wsptr[5];

	232 z3 = (INT32) wsptr[3];

	233 z4 = (INT32) wsptr[1];

	234

	235 tmp0 = MULTIPLY(z1, - FIX_0_211164243) /* sqrt(2) * (c3-c1) */

	236 + MULTIPLY(z2, FIX_1_451774981) /* sqrt(2) * (c3+c7) */

	237 + MULTIPLY(z3, - FIX_2_172734803) /* sqrt(2) * (-c1-c5) */

	238 + MULTIPLY(z4, FIX_1_061594337); /* sqrt(2) * (c5+c7) */

	239

	240 tmp2 = MULTIPLY(z1, - FIX_0_509795579) /* sqrt(2) * (c7-c5) */

	241 + MULTIPLY(z2, - FIX_0_601344887) /* sqrt(2) * (c5-c1) */

	242 + MULTIPLY(z3, FIX_0_899976223) /* sqrt(2) * (c3-c7) */

	243 + MULTIPLY(z4, FIX_2_562915447); /* sqrt(2) * (c1+c3) */

	244

	245 /* Final output stage */

	246

	247 outptr[0] = range_limit[(int) DESCALE(tmp10 + tmp2,

	248 CONST_BITS+PASS1_BITS+3+1)

	249 & RANGE_MASK];

	250 outptr[3] = range_limit[(int) DESCALE(tmp10 - tmp2,

	251 CONST_BITS+PASS1_BITS+3+1)

	252 & RANGE_MASK];

	253 outptr[1] = range_limit[(int) DESCALE(tmp12 + tmp0,

	254 CONST_BITS+PASS1_BITS+3+1)

	255 & RANGE_MASK];

	256 outptr[2] = range_limit[(int) DESCALE(tmp12 - tmp0,

	257 CONST_BITS+PASS1_BITS+3+1)

	258 & RANGE_MASK];

	259

	260 wsptr += DCTSIZE; /* advance pointer to next row */

	261 }

	262 }

	263

	264

	265 /*

	266 * Perform dequantization and inverse DCT on one block of coefficients,

	267 * producing a reduced-size 2x2 output block.

	268 */

	269

	270 GLOBAL(void)

	271 jpeg_idct_2x2 (j_decompress_ptr cinfo, jpeg_component_info * compptr,

	272 JCOEFPTR coef_block,

	273 JSAMPARRAY output_buf, JDIMENSION output_col)

	274 {

	275 INT32 tmp0, tmp10, z1;

	276 JCOEFPTR inptr;

	277 ISLOW_MULT_TYPE * quantptr;

	278 int * wsptr;

	279 JSAMPROW outptr;

	280 JSAMPLE *range_limit = IDCT_range_limit(cinfo);

	281 int ctr;

	282 int workspace[DCTSIZE*2]; /* buffers data between passes */

	283 SHIFT_TEMPS

	284

	285 /* Pass 1: process columns from input, store into work array. */

	286

	287 inptr = coef_block;

	288 quantptr = (ISLOW_MULT_TYPE *) compptr->dct_table;

	289 wsptr = workspace;

	290 for (ctr = DCTSIZE; ctr > 0; inptr++, quantptr++, wsptr++, ctr--) {

	291 /* Don't bother to process columns 2,4,6 */

	292 if (ctr == DCTSIZE-2 || ctr == DCTSIZE-4 || ctr == DCTSIZE-6)

	293 continue;

	294 if (inptr[DCTSIZE*1] == 0 && inptr[DCTSIZE*3] == 0 &&

	295 inptr[DCTSIZE*5] == 0 && inptr[DCTSIZE*7] == 0) {

	296 /* AC terms all zero; we need not examine terms 2,4,6 for 2x2 output */

	297 int dcval = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]) << PASS1_BITS;

	298

	299 wsptr[DCTSIZE*0] = dcval;

	300 wsptr[DCTSIZE*1] = dcval;

	301

	302 continue;

	303 }

	304

	305 /* Even part */

	306

	307 z1 = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]);

	308 tmp10 = z1 << (CONST_BITS+2);

	309

	310 /* Odd part */

	311

	312 z1 = DEQUANTIZE(inptr[DCTSIZE*7], quantptr[DCTSIZE*7]);

	313 tmp0 = MULTIPLY(z1, - FIX_0_720959822); /* sqrt(2) * (c7-c5+c3-c1) */

	314 z1 = DEQUANTIZE(inptr[DCTSIZE*5], quantptr[DCTSIZE*5]);

	315 tmp0 += MULTIPLY(z1, FIX_0_850430095); /* sqrt(2) * (-c1+c3+c5+c7) */

	316 z1 = DEQUANTIZE(inptr[DCTSIZE*3], quantptr[DCTSIZE*3]);

	317 tmp0 += MULTIPLY(z1, - FIX_1_272758580); /* sqrt(2) * (-c1+c3-c5-c7) */

	318 z1 = DEQUANTIZE(inptr[DCTSIZE*1], quantptr[DCTSIZE*1]);

	319 tmp0 += MULTIPLY(z1, FIX_3_624509785); /* sqrt(2) * (c1+c3+c5+c7) */

	320

	321 /* Final output stage */

	322

	323 wsptr[DCTSIZE*0] = (int) DESCALE(tmp10 + tmp0, CONST_BITS-PASS1_BITS+2);

	324 wsptr[DCTSIZE*1] = (int) DESCALE(tmp10 - tmp0, CONST_BITS-PASS1_BITS+2);

	325 }

	326

	327 /* Pass 2: process 2 rows from work array, store into output array. */

	328

	329 wsptr = workspace;

	330 for (ctr = 0; ctr < 2; ctr++) {

	331 outptr = output_buf[ctr] + output_col;

	332 /* It's not clear whether a zero row test is worthwhile here ... */

	333

	334 #ifndef NO_ZERO_ROW_TEST

	335 if (wsptr[1] == 0 && wsptr[3] == 0 && wsptr[5] == 0 && wsptr[7] == 0) {

	336 /* AC terms all zero */

	337 JSAMPLE dcval = range_limit[(int) DESCALE((INT32) wsptr[0], PASS1_BITS+3)

	338 & RANGE_MASK];

	339

	340 outptr[0] = dcval;

	341 outptr[1] = dcval;

	342

	343 wsptr += DCTSIZE; /* advance pointer to next row */

	344 continue;

	345 }

	346 #endif

	347

	348 /* Even part */

	349

	350 tmp10 = ((INT32) wsptr[0]) << (CONST_BITS+2);

	351

	352 /* Odd part */

	353

	354 tmp0 = MULTIPLY((INT32) wsptr[7], - FIX_0_720959822) /* sqrt(2) * (c7-c5+c3-c1) */

	355 + MULTIPLY((INT32) wsptr[5], FIX_0_850430095) /* sqrt(2) * (-c1+c3+c5+c7) */

	356 + MULTIPLY((INT32) wsptr[3], - FIX_1_272758580) /* sqrt(2) * (-c1+c3-c5-c7) */

	357 + MULTIPLY((INT32) wsptr[1], FIX_3_624509785); /* sqrt(2) * (c1+c3+c5+c7) */

	358

	359 /* Final output stage */

	360

	361 outptr[0] = range_limit[(int) DESCALE(tmp10 + tmp0,

	362 CONST_BITS+PASS1_BITS+3+2)

	363 & RANGE_MASK];

	364 outptr[1] = range_limit[(int) DESCALE(tmp10 - tmp0,

	365 CONST_BITS+PASS1_BITS+3+2)

	366 & RANGE_MASK];

	367

	368 wsptr += DCTSIZE; /* advance pointer to next row */

	369 }

	370 }

	371

	372

	373 /*

	374 * Perform dequantization and inverse DCT on one block of coefficients,

	375 * producing a reduced-size 1x1 output block.

	376 */

	377

	378 GLOBAL(void)

	379 jpeg_idct_1x1 (j_decompress_ptr cinfo, jpeg_component_info * compptr,

	380 JCOEFPTR coef_block,

	381 JSAMPARRAY output_buf, JDIMENSION output_col)

	382 {

	383 int dcval;

	384 ISLOW_MULT_TYPE * quantptr;

	385 JSAMPLE *range_limit = IDCT_range_limit(cinfo);

	386 SHIFT_TEMPS

	387

	388 /* We hardly need an inverse DCT routine for this: just take the

	389 * average pixel value, which is one-eighth of the DC coefficient.

	390 */

	391 quantptr = (ISLOW_MULT_TYPE *) compptr->dct_table;

	392 dcval = DEQUANTIZE(coef_block[0], quantptr[0]);

	393 dcval = (int) DESCALE((INT32) dcval, 3);

	394

	395 output_buf[0][output_col] = range_limit[dcval & RANGE_MASK];

	396 }

	397

	398 #endif /* IDCT_SCALING_SUPPORTED */

OLD	NEW

« no previous file with comments | « third_party/libjpeg_turbo/jidctint.c ('k') | third_party/libjpeg_turbo/jinclude.h » ('j') | no next file with comments »