| Index: jccolor.c | 
| diff --git a/jccolor.c b/jccolor.c | 
| index 94b41840b59610d78c05d5382000848d73a7ccff..a93498ab083dda28e274e66e5576f9e538422aa5 100644 | 
| --- a/jccolor.c | 
| +++ b/jccolor.c | 
| @@ -5,8 +5,10 @@ | 
| * Copyright (C) 1991-1996, Thomas G. Lane. | 
| * libjpeg-turbo Modifications: | 
| * Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB | 
| - * Copyright (C) 2009-2012, D. R. Commander. | 
| - * For conditions of distribution and use, see the accompanying README file. | 
| + * Copyright (C) 2009-2012, 2015 D. R. Commander. | 
| + * Copyright (C) 2014, MIPS Technologies, Inc., California | 
| + * For conditions of distribution and use, see the accompanying README.ijg | 
| + * file. | 
| * | 
| * This file contains input colorspace conversion routines. | 
| */ | 
| @@ -15,7 +17,7 @@ | 
| #include "jinclude.h" | 
| #include "jpeglib.h" | 
| #include "jsimd.h" | 
| -#include "config.h" | 
| +#include "jconfigint.h" | 
|  | 
|  | 
| /* Private subobject */ | 
| @@ -24,10 +26,10 @@ typedef struct { | 
| struct jpeg_color_converter pub; /* public fields */ | 
|  | 
| /* Private state for RGB->YCC conversion */ | 
| -  INT32 * rgb_ycc_tab;		/* => table for RGB to YCbCr conversion */ | 
| +  JLONG *rgb_ycc_tab;           /* => table for RGB to YCbCr conversion */ | 
| } my_color_converter; | 
|  | 
| -typedef my_color_converter * my_cconvert_ptr; | 
| +typedef my_color_converter *my_cconvert_ptr; | 
|  | 
|  | 
| /**************** RGB -> YCbCr conversion: most common case **************/ | 
| @@ -36,9 +38,9 @@ typedef my_color_converter * my_cconvert_ptr; | 
| * YCbCr is defined per CCIR 601-1, except that Cb and Cr are | 
| * normalized to the range 0..MAXJSAMPLE rather than -0.5 .. 0.5. | 
| * The conversion equations to be implemented are therefore | 
| - *	Y  =  0.29900 * R + 0.58700 * G + 0.11400 * B | 
| - *	Cb = -0.16874 * R - 0.33126 * G + 0.50000 * B  + CENTERJSAMPLE | 
| - *	Cr =  0.50000 * R - 0.41869 * G - 0.08131 * B  + CENTERJSAMPLE | 
| + *      Y  =  0.29900 * R + 0.58700 * G + 0.11400 * B | 
| + *      Cb = -0.16874 * R - 0.33126 * G + 0.50000 * B  + CENTERJSAMPLE | 
| + *      Cr =  0.50000 * R - 0.41869 * G - 0.08131 * B  + CENTERJSAMPLE | 
| * (These numbers are derived from TIFF 6.0 section 21, dated 3-June-92.) | 
| * Note: older versions of the IJG code used a zero offset of MAXJSAMPLE/2, | 
| * rather than CENTERJSAMPLE, for Cb and Cr.  This gave equal positive and | 
| @@ -60,10 +62,10 @@ typedef my_color_converter * my_cconvert_ptr; | 
| * in the tables to save adding them separately in the inner loop. | 
| */ | 
|  | 
| -#define SCALEBITS	16	/* speediest right-shift on some machines */ | 
| -#define CBCR_OFFSET	((INT32) CENTERJSAMPLE << SCALEBITS) | 
| -#define ONE_HALF	((INT32) 1 << (SCALEBITS-1)) | 
| -#define FIX(x)		((INT32) ((x) * (1L<<SCALEBITS) + 0.5)) | 
| +#define SCALEBITS       16      /* speediest right-shift on some machines */ | 
| +#define CBCR_OFFSET     ((JLONG) CENTERJSAMPLE << SCALEBITS) | 
| +#define ONE_HALF        ((JLONG) 1 << (SCALEBITS-1)) | 
| +#define FIX(x)          ((JLONG) ((x) * (1L<<SCALEBITS) + 0.5)) | 
|  | 
| /* We allocate one big table and divide it up into eight parts, instead of | 
| * doing eight alloc_small requests.  This lets us use a single table base | 
| @@ -71,16 +73,16 @@ typedef my_color_converter * my_cconvert_ptr; | 
| * machines (more than can hold all eight addresses, anyway). | 
| */ | 
|  | 
| -#define R_Y_OFF		0			/* offset to R => Y section */ | 
| -#define G_Y_OFF		(1*(MAXJSAMPLE+1))	/* offset to G => Y section */ | 
| -#define B_Y_OFF		(2*(MAXJSAMPLE+1))	/* etc. */ | 
| -#define R_CB_OFF	(3*(MAXJSAMPLE+1)) | 
| -#define G_CB_OFF	(4*(MAXJSAMPLE+1)) | 
| -#define B_CB_OFF	(5*(MAXJSAMPLE+1)) | 
| -#define R_CR_OFF	B_CB_OFF		/* B=>Cb, R=>Cr are the same */ | 
| -#define G_CR_OFF	(6*(MAXJSAMPLE+1)) | 
| -#define B_CR_OFF	(7*(MAXJSAMPLE+1)) | 
| -#define TABLE_SIZE	(8*(MAXJSAMPLE+1)) | 
| +#define R_Y_OFF         0                       /* offset to R => Y section */ | 
| +#define G_Y_OFF         (1*(MAXJSAMPLE+1))      /* offset to G => Y section */ | 
| +#define B_Y_OFF         (2*(MAXJSAMPLE+1))      /* etc. */ | 
| +#define R_CB_OFF        (3*(MAXJSAMPLE+1)) | 
| +#define G_CB_OFF        (4*(MAXJSAMPLE+1)) | 
| +#define B_CB_OFF        (5*(MAXJSAMPLE+1)) | 
| +#define R_CR_OFF        B_CB_OFF                /* B=>Cb, R=>Cr are the same */ | 
| +#define G_CR_OFF        (6*(MAXJSAMPLE+1)) | 
| +#define B_CR_OFF        (7*(MAXJSAMPLE+1)) | 
| +#define TABLE_SIZE      (8*(MAXJSAMPLE+1)) | 
|  | 
|  | 
| /* Include inline routines for colorspace extensions */ | 
| @@ -196,13 +198,13 @@ METHODDEF(void) | 
| rgb_ycc_start (j_compress_ptr cinfo) | 
| { | 
| my_cconvert_ptr cconvert = (my_cconvert_ptr) cinfo->cconvert; | 
| -  INT32 * rgb_ycc_tab; | 
| -  INT32 i; | 
| +  JLONG *rgb_ycc_tab; | 
| +  JLONG i; | 
|  | 
| /* Allocate and fill in the conversion tables. */ | 
| -  cconvert->rgb_ycc_tab = rgb_ycc_tab = (INT32 *) | 
| +  cconvert->rgb_ycc_tab = rgb_ycc_tab = (JLONG *) | 
| (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE, | 
| -				(TABLE_SIZE * SIZEOF(INT32))); | 
| +                                (TABLE_SIZE * sizeof(JLONG))); | 
|  | 
| for (i = 0; i <= MAXJSAMPLE; i++) { | 
| rgb_ycc_tab[i+R_Y_OFF] = FIX(0.29900) * i; | 
| @@ -230,8 +232,8 @@ rgb_ycc_start (j_compress_ptr cinfo) | 
|  | 
| METHODDEF(void) | 
| rgb_ycc_convert (j_compress_ptr cinfo, | 
| -		 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| -		 JDIMENSION output_row, int num_rows) | 
| +                 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| +                 JDIMENSION output_row, int num_rows) | 
| { | 
| switch (cinfo->in_color_space) { | 
| case JCS_EXT_RGB: | 
| @@ -279,8 +281,8 @@ rgb_ycc_convert (j_compress_ptr cinfo, | 
|  | 
| METHODDEF(void) | 
| rgb_gray_convert (j_compress_ptr cinfo, | 
| -		  JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| -		  JDIMENSION output_row, int num_rows) | 
| +                  JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| +                  JDIMENSION output_row, int num_rows) | 
| { | 
| switch (cinfo->in_color_space) { | 
| case JCS_EXT_RGB: | 
| @@ -325,8 +327,8 @@ rgb_gray_convert (j_compress_ptr cinfo, | 
|  | 
| METHODDEF(void) | 
| rgb_rgb_convert (j_compress_ptr cinfo, | 
| -		  JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| -		  JDIMENSION output_row, int num_rows) | 
| +                  JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| +                  JDIMENSION output_row, int num_rows) | 
| { | 
| switch (cinfo->in_color_space) { | 
| case JCS_EXT_RGB: | 
| @@ -375,12 +377,12 @@ rgb_rgb_convert (j_compress_ptr cinfo, | 
|  | 
| METHODDEF(void) | 
| cmyk_ycck_convert (j_compress_ptr cinfo, | 
| -		   JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| -		   JDIMENSION output_row, int num_rows) | 
| +                   JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| +                   JDIMENSION output_row, int num_rows) | 
| { | 
| my_cconvert_ptr cconvert = (my_cconvert_ptr) cinfo->cconvert; | 
| register int r, g, b; | 
| -  register INT32 * ctab = cconvert->rgb_ycc_tab; | 
| +  register JLONG *ctab = cconvert->rgb_ycc_tab; | 
| register JSAMPROW inptr; | 
| register JSAMPROW outptr0, outptr1, outptr2, outptr3; | 
| register JDIMENSION col; | 
| @@ -398,7 +400,7 @@ cmyk_ycck_convert (j_compress_ptr cinfo, | 
| g = MAXJSAMPLE - GETJSAMPLE(inptr[1]); | 
| b = MAXJSAMPLE - GETJSAMPLE(inptr[2]); | 
| /* K passes through as-is */ | 
| -      outptr3[col] = inptr[3];	/* don't need GETJSAMPLE here */ | 
| +      outptr3[col] = inptr[3];  /* don't need GETJSAMPLE here */ | 
| inptr += 4; | 
| /* If the inputs are 0..MAXJSAMPLE, the outputs of these equations | 
| * must be too; we do not need an explicit range-limiting operation. | 
| @@ -407,16 +409,16 @@ cmyk_ycck_convert (j_compress_ptr cinfo, | 
| */ | 
| /* Y */ | 
| outptr0[col] = (JSAMPLE) | 
| -		((ctab[r+R_Y_OFF] + ctab[g+G_Y_OFF] + ctab[b+B_Y_OFF]) | 
| -		 >> SCALEBITS); | 
| +                ((ctab[r+R_Y_OFF] + ctab[g+G_Y_OFF] + ctab[b+B_Y_OFF]) | 
| +                 >> SCALEBITS); | 
| /* Cb */ | 
| outptr1[col] = (JSAMPLE) | 
| -		((ctab[r+R_CB_OFF] + ctab[g+G_CB_OFF] + ctab[b+B_CB_OFF]) | 
| -		 >> SCALEBITS); | 
| +                ((ctab[r+R_CB_OFF] + ctab[g+G_CB_OFF] + ctab[b+B_CB_OFF]) | 
| +                 >> SCALEBITS); | 
| /* Cr */ | 
| outptr2[col] = (JSAMPLE) | 
| -		((ctab[r+R_CR_OFF] + ctab[g+G_CR_OFF] + ctab[b+B_CR_OFF]) | 
| -		 >> SCALEBITS); | 
| +                ((ctab[r+R_CR_OFF] + ctab[g+G_CR_OFF] + ctab[b+B_CR_OFF]) | 
| +                 >> SCALEBITS); | 
| } | 
| } | 
| } | 
| @@ -430,8 +432,8 @@ cmyk_ycck_convert (j_compress_ptr cinfo, | 
|  | 
| METHODDEF(void) | 
| grayscale_convert (j_compress_ptr cinfo, | 
| -		   JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| -		   JDIMENSION output_row, int num_rows) | 
| +                   JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| +                   JDIMENSION output_row, int num_rows) | 
| { | 
| register JSAMPROW inptr; | 
| register JSAMPROW outptr; | 
| @@ -444,7 +446,7 @@ grayscale_convert (j_compress_ptr cinfo, | 
| outptr = output_buf[0][output_row]; | 
| output_row++; | 
| for (col = 0; col < num_cols; col++) { | 
| -      outptr[col] = inptr[0];	/* don't need GETJSAMPLE() here */ | 
| +      outptr[col] = inptr[0];   /* don't need GETJSAMPLE() here */ | 
| inptr += instride; | 
| } | 
| } | 
| @@ -459,28 +461,58 @@ grayscale_convert (j_compress_ptr cinfo, | 
|  | 
| METHODDEF(void) | 
| null_convert (j_compress_ptr cinfo, | 
| -	      JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| -	      JDIMENSION output_row, int num_rows) | 
| +              JSAMPARRAY input_buf, JSAMPIMAGE output_buf, | 
| +              JDIMENSION output_row, int num_rows) | 
| { | 
| register JSAMPROW inptr; | 
| -  register JSAMPROW outptr; | 
| +  register JSAMPROW outptr, outptr0, outptr1, outptr2, outptr3; | 
| register JDIMENSION col; | 
| register int ci; | 
| int nc = cinfo->num_components; | 
| JDIMENSION num_cols = cinfo->image_width; | 
|  | 
| -  while (--num_rows >= 0) { | 
| -    /* It seems fastest to make a separate pass for each component. */ | 
| -    for (ci = 0; ci < nc; ci++) { | 
| -      inptr = *input_buf; | 
| -      outptr = output_buf[ci][output_row]; | 
| +  if (nc == 3) { | 
| +    while (--num_rows >= 0) { | 
| +      inptr = *input_buf++; | 
| +      outptr0 = output_buf[0][output_row]; | 
| +      outptr1 = output_buf[1][output_row]; | 
| +      outptr2 = output_buf[2][output_row]; | 
| +      output_row++; | 
| for (col = 0; col < num_cols; col++) { | 
| -	outptr[col] = inptr[ci]; /* don't need GETJSAMPLE() here */ | 
| -	inptr += nc; | 
| +        outptr0[col] = *inptr++; | 
| +        outptr1[col] = *inptr++; | 
| +        outptr2[col] = *inptr++; | 
| } | 
| } | 
| -    input_buf++; | 
| -    output_row++; | 
| +  } else if (nc == 4) { | 
| +    while (--num_rows >= 0) { | 
| +      inptr = *input_buf++; | 
| +      outptr0 = output_buf[0][output_row]; | 
| +      outptr1 = output_buf[1][output_row]; | 
| +      outptr2 = output_buf[2][output_row]; | 
| +      outptr3 = output_buf[3][output_row]; | 
| +      output_row++; | 
| +      for (col = 0; col < num_cols; col++) { | 
| +        outptr0[col] = *inptr++; | 
| +        outptr1[col] = *inptr++; | 
| +        outptr2[col] = *inptr++; | 
| +        outptr3[col] = *inptr++; | 
| +      } | 
| +    } | 
| +  } else { | 
| +    while (--num_rows >= 0) { | 
| +      /* It seems fastest to make a separate pass for each component. */ | 
| +      for (ci = 0; ci < nc; ci++) { | 
| +        inptr = *input_buf; | 
| +        outptr = output_buf[ci][output_row]; | 
| +        for (col = 0; col < num_cols; col++) { | 
| +          outptr[col] = inptr[ci]; /* don't need GETJSAMPLE() here */ | 
| +          inptr += nc; | 
| +        } | 
| +      } | 
| +      input_buf++; | 
| +      output_row++; | 
| +    } | 
| } | 
| } | 
|  | 
| @@ -507,7 +539,7 @@ jinit_color_converter (j_compress_ptr cinfo) | 
|  | 
| cconvert = (my_cconvert_ptr) | 
| (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE, | 
| -				SIZEOF(my_color_converter)); | 
| +                                sizeof(my_color_converter)); | 
| cinfo->cconvert = (struct jpeg_color_converter *) cconvert; | 
| /* set start_pass to null method until we find out differently */ | 
| cconvert->pub.start_pass = null_method; | 
| @@ -545,7 +577,7 @@ jinit_color_converter (j_compress_ptr cinfo) | 
| ERREXIT(cinfo, JERR_BAD_IN_COLORSPACE); | 
| break; | 
|  | 
| -  default:			/* JCS_UNKNOWN can be anything */ | 
| +  default:                      /* JCS_UNKNOWN can be anything */ | 
| if (cinfo->input_components < 1) | 
| ERREXIT(cinfo, JERR_BAD_IN_COLORSPACE); | 
| break; | 
| @@ -587,19 +619,24 @@ jinit_color_converter (j_compress_ptr cinfo) | 
| if (rgb_red[cinfo->in_color_space] == 0 && | 
| rgb_green[cinfo->in_color_space] == 1 && | 
| rgb_blue[cinfo->in_color_space] == 2 && | 
| -        rgb_pixelsize[cinfo->in_color_space] == 3) | 
| -      cconvert->pub.color_convert = null_convert; | 
| -    else if (cinfo->in_color_space == JCS_RGB || | 
| -             cinfo->in_color_space == JCS_EXT_RGB || | 
| -             cinfo->in_color_space == JCS_EXT_RGBX || | 
| -             cinfo->in_color_space == JCS_EXT_BGR || | 
| -             cinfo->in_color_space == JCS_EXT_BGRX || | 
| -             cinfo->in_color_space == JCS_EXT_XBGR || | 
| -             cinfo->in_color_space == JCS_EXT_XRGB || | 
| -             cinfo->in_color_space == JCS_EXT_RGBA || | 
| -             cinfo->in_color_space == JCS_EXT_BGRA || | 
| -             cinfo->in_color_space == JCS_EXT_ABGR || | 
| -             cinfo->in_color_space == JCS_EXT_ARGB) | 
| +        rgb_pixelsize[cinfo->in_color_space] == 3) { | 
| +#if defined(__mips__) | 
| +      if (jsimd_c_can_null_convert()) | 
| +        cconvert->pub.color_convert = jsimd_c_null_convert; | 
| +      else | 
| +#endif | 
| +        cconvert->pub.color_convert = null_convert; | 
| +    } else if (cinfo->in_color_space == JCS_RGB || | 
| +               cinfo->in_color_space == JCS_EXT_RGB || | 
| +               cinfo->in_color_space == JCS_EXT_RGBX || | 
| +               cinfo->in_color_space == JCS_EXT_BGR || | 
| +               cinfo->in_color_space == JCS_EXT_BGRX || | 
| +               cinfo->in_color_space == JCS_EXT_XBGR || | 
| +               cinfo->in_color_space == JCS_EXT_XRGB || | 
| +               cinfo->in_color_space == JCS_EXT_RGBA || | 
| +               cinfo->in_color_space == JCS_EXT_BGRA || | 
| +               cinfo->in_color_space == JCS_EXT_ABGR || | 
| +               cinfo->in_color_space == JCS_EXT_ARGB) | 
| cconvert->pub.color_convert = rgb_rgb_convert; | 
| else | 
| ERREXIT(cinfo, JERR_CONVERSION_NOTIMPL); | 
| @@ -625,18 +662,28 @@ jinit_color_converter (j_compress_ptr cinfo) | 
| cconvert->pub.start_pass = rgb_ycc_start; | 
| cconvert->pub.color_convert = rgb_ycc_convert; | 
| } | 
| -    } else if (cinfo->in_color_space == JCS_YCbCr) | 
| -      cconvert->pub.color_convert = null_convert; | 
| -    else | 
| +    } else if (cinfo->in_color_space == JCS_YCbCr) { | 
| +#if defined(__mips__) | 
| +      if (jsimd_c_can_null_convert()) | 
| +        cconvert->pub.color_convert = jsimd_c_null_convert; | 
| +      else | 
| +#endif | 
| +        cconvert->pub.color_convert = null_convert; | 
| +    } else | 
| ERREXIT(cinfo, JERR_CONVERSION_NOTIMPL); | 
| break; | 
|  | 
| case JCS_CMYK: | 
| if (cinfo->num_components != 4) | 
| ERREXIT(cinfo, JERR_BAD_J_COLORSPACE); | 
| -    if (cinfo->in_color_space == JCS_CMYK) | 
| -      cconvert->pub.color_convert = null_convert; | 
| -    else | 
| +    if (cinfo->in_color_space == JCS_CMYK) { | 
| +#if defined(__mips__) | 
| +      if (jsimd_c_can_null_convert()) | 
| +        cconvert->pub.color_convert = jsimd_c_null_convert; | 
| +      else | 
| +#endif | 
| +        cconvert->pub.color_convert = null_convert; | 
| +    } else | 
| ERREXIT(cinfo, JERR_CONVERSION_NOTIMPL); | 
| break; | 
|  | 
| @@ -646,17 +693,27 @@ jinit_color_converter (j_compress_ptr cinfo) | 
| if (cinfo->in_color_space == JCS_CMYK) { | 
| cconvert->pub.start_pass = rgb_ycc_start; | 
| cconvert->pub.color_convert = cmyk_ycck_convert; | 
| -    } else if (cinfo->in_color_space == JCS_YCCK) | 
| -      cconvert->pub.color_convert = null_convert; | 
| -    else | 
| +    } else if (cinfo->in_color_space == JCS_YCCK) { | 
| +#if defined(__mips__) | 
| +      if (jsimd_c_can_null_convert()) | 
| +        cconvert->pub.color_convert = jsimd_c_null_convert; | 
| +      else | 
| +#endif | 
| +        cconvert->pub.color_convert = null_convert; | 
| +    } else | 
| ERREXIT(cinfo, JERR_CONVERSION_NOTIMPL); | 
| break; | 
|  | 
| -  default:			/* allow null conversion of JCS_UNKNOWN */ | 
| +  default:                      /* allow null conversion of JCS_UNKNOWN */ | 
| if (cinfo->jpeg_color_space != cinfo->in_color_space || | 
| -	cinfo->num_components != cinfo->input_components) | 
| +        cinfo->num_components != cinfo->input_components) | 
| ERREXIT(cinfo, JERR_CONVERSION_NOTIMPL); | 
| -    cconvert->pub.color_convert = null_convert; | 
| +#if defined(__mips__) | 
| +    if (jsimd_c_can_null_convert()) | 
| +      cconvert->pub.color_convert = jsimd_c_null_convert; | 
| +    else | 
| +#endif | 
| +      cconvert->pub.color_convert = null_convert; | 
| break; | 
| } | 
| } | 
|  |