Home | History | Annotate | Download | only in qcms
      1 diff --git a/third_party/qcms/src/iccread.c b/third_party/qcms/src/iccread.c
      2 index 36b7011..9ee6b94 100644
      3 --- a/third_party/qcms/src/iccread.c
      4 +++ b/third_party/qcms/src/iccread.c
      5 @@ -266,7 +266,7 @@ qcms_bool qcms_profile_is_bogus(qcms_profile *profile)
      6         if (profile->color_space != RGB_SIGNATURE)
      7  	       return false;
      8  
      9 -       if (profile->A2B0 || profile->B2A0)
     10 +       if (qcms_supports_iccv4 && (profile->A2B0 || profile->B2A0))
     11                 return false;
     12  
     13         rX = s15Fixed16Number_to_float(profile->redColorant.X);
     14 @@ -297,6 +297,11 @@ qcms_bool qcms_profile_is_bogus(qcms_profile *profile)
     15         sum[1] = rY + gY + bY;
     16         sum[2] = rZ + gZ + bZ;
     17  
     18 +#if defined (_MSC_VER)
     19 +#pragma warning(push)
     20 +/* Disable double to float truncation warning 4305 */
     21 +#pragma warning(disable:4305)
     22 +#endif
     23         // Build our target vector (see mozilla bug 460629)
     24         target[0] = 0.96420;
     25         target[1] = 1.00000;
     26 @@ -310,6 +315,10 @@ qcms_bool qcms_profile_is_bogus(qcms_profile *profile)
     27         tolerance[1] = 0.02;
     28         tolerance[2] = 0.04;
     29  
     30 +#if defined (_MSC_VER)
     31 +/* Restore warnings */
     32 +#pragma warning(pop)
     33 +#endif
     34         // Compare with our tolerance
     35         for (i = 0; i < 3; ++i) {
     36             if (!(((sum[i] - tolerance[i]) <= target[i]) &&
     37 @@ -402,7 +411,7 @@ static struct XYZNumber read_tag_XYZType(struct mem_source *src, struct tag_inde
     38  // present that are not part of the tag_index.
     39  static struct curveType *read_curveType(struct mem_source *src, uint32_t offset, uint32_t *len)
     40  {
     41 -	static const size_t COUNT_TO_LENGTH[5] = {1, 3, 4, 5, 7};
     42 +	static const uint32_t COUNT_TO_LENGTH[5] = {1, 3, 4, 5, 7};
     43  	struct curveType *curve = NULL;
     44  	uint32_t type = read_u32(src, offset);
     45  	uint32_t count;
     46 @@ -657,7 +666,7 @@ static struct lutType *read_tag_lutType(struct mem_source *src, struct tag_index
     47  	uint16_t num_input_table_entries;
     48  	uint16_t num_output_table_entries;
     49  	uint8_t in_chan, grid_points, out_chan;
     50 -	uint32_t clut_offset, output_offset;
     51 +	size_t clut_offset, output_offset;
     52  	uint32_t clut_size;
     53  	size_t entry_size;
     54  	struct lutType *lut;
     55 @@ -997,6 +1006,9 @@ qcms_profile* qcms_profile_from_memory(const void *mem, size_t size)
     56  	source.size = size;
     57  	source.valid = true;
     58  
     59 +	if (size < 4)
     60 +		return INVALID_PROFILE;
     61 +
     62  	length = read_u32(src, 0);
     63  	if (length <= size) {
     64  		// shrink the area that we can read if appropriate
     65 diff --git a/third_party/qcms/src/qcms.h b/third_party/qcms/src/qcms.h
     66 index 7d83623..11fe222 100644
     67 --- a/third_party/qcms/src/qcms.h
     68 +++ b/third_party/qcms/src/qcms.h
     69 @@ -40,6 +40,12 @@ sale, use or other dealings in this Software without written
     70  authorization from SunSoft Inc. 
     71  ******************************************************************/
     72  
     73 +/*
     74 + * QCMS, in general, is not threadsafe. However, it should be safe to create
     75 + * profile and transformation objects on different threads, so long as you
     76 + * don't use the same objects on different threads at the same time.
     77 + */
     78 +
     79  /* 
     80   * Color Space Signatures
     81   * Note that only icSigXYZData and icSigLabData are valid
     82 @@ -102,6 +108,12 @@ typedef enum {
     83  	QCMS_DATA_GRAYA_8
     84  } qcms_data_type;
     85  
     86 +/* Format of the output data for qcms_transform_data_type() */
     87 +typedef enum {
     88 +	QCMS_OUTPUT_RGBX,
     89 +	QCMS_OUTPUT_BGRX
     90 +} qcms_output_type;
     91 +
     92  /* the names for the following two types are sort of ugly */
     93  typedef struct
     94  {
     95 @@ -146,6 +158,7 @@ qcms_transform* qcms_transform_create(
     96  void qcms_transform_release(qcms_transform *);
     97  
     98  void qcms_transform_data(qcms_transform *transform, void *src, void *dest, size_t length);
     99 +void qcms_transform_data_type(qcms_transform *transform, void *src, void *dest, size_t length, qcms_output_type type);
    100  
    101  void qcms_enable_iccv4();
    102  
    103 diff --git a/third_party/qcms/src/qcmsint.h b/third_party/qcms/src/qcmsint.h
    104 index 53a3420..fb53e96 100644
    105 --- a/third_party/qcms/src/qcmsint.h
    106 +++ b/third_party/qcms/src/qcmsint.h
    107 @@ -45,6 +45,11 @@ struct precache_output
    108  #define ALIGN __attribute__(( aligned (16) ))
    109  #endif
    110  
    111 +typedef struct _qcms_format_type {
    112 +	int r;
    113 +	int b;
    114 +} qcms_format_type;
    115 +
    116  struct _qcms_transform {
    117  	float ALIGN matrix[3][4];
    118  	float *input_gamma_table_r;
    119 @@ -88,7 +93,7 @@ struct _qcms_transform {
    120  	struct precache_output *output_table_g;
    121  	struct precache_output *output_table_b;
    122  
    123 -	void (*transform_fn)(struct _qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length);
    124 +	void (*transform_fn)(struct _qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, struct _qcms_format_type output_format);
    125  };
    126  
    127  struct matrix {
    128 @@ -280,18 +285,40 @@ qcms_bool set_rgb_colorants(qcms_profile *profile, qcms_CIE_xyY white_point, qcm
    129  void qcms_transform_data_rgb_out_lut_sse2(qcms_transform *transform,
    130                                            unsigned char *src,
    131                                            unsigned char *dest,
    132 -                                          size_t length);
    133 +                                          size_t length,
    134 +                                          qcms_format_type output_format);
    135  void qcms_transform_data_rgba_out_lut_sse2(qcms_transform *transform,
    136                                            unsigned char *src,
    137                                            unsigned char *dest,
    138 -                                          size_t length);
    139 +                                          size_t length,
    140 +                                          qcms_format_type output_format);
    141  void qcms_transform_data_rgb_out_lut_sse1(qcms_transform *transform,
    142                                            unsigned char *src,
    143                                            unsigned char *dest,
    144 -                                          size_t length);
    145 +                                          size_t length,
    146 +                                          qcms_format_type output_format);
    147  void qcms_transform_data_rgba_out_lut_sse1(qcms_transform *transform,
    148                                            unsigned char *src,
    149                                            unsigned char *dest,
    150 -                                          size_t length);
    151 +                                          size_t length,
    152 +                                          qcms_format_type output_format);
    153  
    154  extern qcms_bool qcms_supports_iccv4;
    155 +
    156 +
    157 +#ifdef _MSC_VER
    158 +
    159 +long __cdecl _InterlockedIncrement(long volatile *);
    160 +long __cdecl _InterlockedDecrement(long volatile *);
    161 +#pragma intrinsic(_InterlockedIncrement)
    162 +#pragma intrinsic(_InterlockedDecrement)
    163 +
    164 +#define qcms_atomic_increment(x) _InterlockedIncrement((long volatile *)&x)
    165 +#define qcms_atomic_decrement(x) _InterlockedDecrement((long volatile*)&x)
    166 +
    167 +#else
    168 +
    169 +#define qcms_atomic_increment(x) __sync_add_and_fetch(&x, 1)
    170 +#define qcms_atomic_decrement(x) __sync_sub_and_fetch(&x, 1)
    171 +
    172 +#endif
    173 diff --git a/third_party/qcms/src/qcmstypes.h b/third_party/qcms/src/qcmstypes.h
    174 index 56d8de3..d58f691 100644
    175 --- a/third_party/qcms/src/qcmstypes.h
    176 +++ b/third_party/qcms/src/qcmstypes.h
    177 @@ -22,37 +22,6 @@
    178  #ifndef QCMS_TYPES_H
    179  #define QCMS_TYPES_H
    180  
    181 -#ifdef MOZ_QCMS
    182 -
    183 -#include "prtypes.h"
    184 -
    185 -/* prtypes.h defines IS_LITTLE_ENDIAN and IS_BIG ENDIAN */
    186 -
    187 -#if defined (__SVR4) && defined (__sun)
    188 -/* int_types.h gets included somehow, so avoid redefining the types differently */
    189 -#include <sys/int_types.h>
    190 -#elif defined (_AIX)
    191 -#include <sys/types.h>
    192 -#elif !defined(ANDROID) && !defined(__OpenBSD__)
    193 -typedef PRInt8 int8_t;
    194 -typedef PRUint8 uint8_t;
    195 -typedef PRInt16 int16_t;
    196 -typedef PRUint16 uint16_t;
    197 -typedef PRInt32 int32_t;
    198 -typedef PRUint32 uint32_t;
    199 -typedef PRInt64 int64_t;
    200 -typedef PRUint64 uint64_t;
    201 -
    202 -#ifdef __OS2__
    203 -/* OS/2's stdlib typdefs uintptr_t. So we'll just include that so we don't collide */
    204 -#include <stdlib.h>
    205 -#elif !defined(__intptr_t_defined) && !defined(_UINTPTR_T_DEFINED)
    206 -typedef PRUptrdiff uintptr_t;
    207 -#endif
    208 -#endif
    209 -
    210 -#else // MOZ_QCMS
    211 -
    212  #if BYTE_ORDER == LITTLE_ENDIAN
    213  #define IS_LITTLE_ENDIAN
    214  #elif BYTE_ORDER == BIG_ENDIAN
    215 @@ -75,7 +44,7 @@ typedef PRUptrdiff uintptr_t;
    216  
    217  #if defined (_SVR4) || defined (SVR4) || defined (__OpenBSD__) || defined (_sgi) || defined (__sun) || defined (sun) || defined (__digital__)
    218  #  include <inttypes.h>
    219 -#elif defined (_MSC_VER)
    220 +#elif defined (_MSC_VER) && _MSC_VER < 1600
    221  typedef __int8 int8_t;
    222  typedef unsigned __int8 uint8_t;
    223  typedef __int16 int16_t;
    224 @@ -87,7 +56,12 @@ typedef unsigned __int64 uint64_t;
    225  #ifdef _WIN64
    226  typedef unsigned __int64 uintptr_t;
    227  #else
    228 +#pragma warning(push)
    229 +/* Disable benign redefinition of type warning 4142 */
    230 +#pragma warning(disable:4142)
    231  typedef unsigned long uintptr_t;
    232 +/* Restore warnings */
    233 +#pragma warning(pop)
    234  #endif
    235  
    236  #elif defined (_AIX)
    237 @@ -96,8 +70,6 @@ typedef unsigned long uintptr_t;
    238  #  include <stdint.h>
    239  #endif
    240  
    241 -#endif
    242 -
    243  typedef qcms_bool bool;
    244  #define true 1
    245  #define false 0
    246 diff --git a/third_party/qcms/src/transform-sse1.c b/third_party/qcms/src/transform-sse1.c
    247 index 2f34db5..aaee1bf 100644
    248 --- a/third_party/qcms/src/transform-sse1.c
    249 +++ b/third_party/qcms/src/transform-sse1.c
    250 @@ -34,7 +34,8 @@ static const ALIGN float clampMaxValueX4[4] =
    251  void qcms_transform_data_rgb_out_lut_sse1(qcms_transform *transform,
    252                                            unsigned char *src,
    253                                            unsigned char *dest,
    254 -                                          size_t length)
    255 +                                          size_t length,
    256 +                                          qcms_format_type output_format)
    257  {
    258      unsigned int i;
    259      float (*mat)[4] = transform->matrix;
    260 @@ -70,6 +71,8 @@ void qcms_transform_data_rgb_out_lut_sse1(qcms_transform *transform,
    261  
    262      /* working variables */
    263      __m128 vec_r, vec_g, vec_b, result;
    264 +    const int r_out = output_format.r;
    265 +    const int b_out = output_format.b;
    266  
    267      /* CYA */
    268      if (!length)
    269 @@ -116,9 +119,9 @@ void qcms_transform_data_rgb_out_lut_sse1(qcms_transform *transform,
    270          src += 3;
    271  
    272          /* use calc'd indices to output RGB values */
    273 -        dest[0] = otdata_r[output[0]];
    274 -        dest[1] = otdata_g[output[1]];
    275 -        dest[2] = otdata_b[output[2]];
    276 +        dest[r_out] = otdata_r[output[0]];
    277 +        dest[1]     = otdata_g[output[1]];
    278 +        dest[b_out] = otdata_b[output[2]];
    279          dest += 3;
    280      }
    281  
    282 @@ -141,9 +144,9 @@ void qcms_transform_data_rgb_out_lut_sse1(qcms_transform *transform,
    283      result = _mm_movehl_ps(result, result);
    284      *((__m64 *)&output[2]) = _mm_cvtps_pi32(result);
    285  
    286 -    dest[0] = otdata_r[output[0]];
    287 -    dest[1] = otdata_g[output[1]];
    288 -    dest[2] = otdata_b[output[2]];
    289 +    dest[r_out] = otdata_r[output[0]];
    290 +    dest[1]     = otdata_g[output[1]];
    291 +    dest[b_out] = otdata_b[output[2]];
    292  
    293      _mm_empty();
    294  }
    295 @@ -151,7 +154,8 @@ void qcms_transform_data_rgb_out_lut_sse1(qcms_transform *transform,
    296  void qcms_transform_data_rgba_out_lut_sse1(qcms_transform *transform,
    297                                             unsigned char *src,
    298                                             unsigned char *dest,
    299 -                                           size_t length)
    300 +                                           size_t length,
    301 +                                           qcms_format_type output_format)
    302  {
    303      unsigned int i;
    304      float (*mat)[4] = transform->matrix;
    305 @@ -187,6 +191,8 @@ void qcms_transform_data_rgba_out_lut_sse1(qcms_transform *transform,
    306  
    307      /* working variables */
    308      __m128 vec_r, vec_g, vec_b, result;
    309 +    const int r_out = output_format.r;
    310 +    const int b_out = output_format.b;
    311      unsigned char alpha;
    312  
    313      /* CYA */
    314 @@ -239,9 +245,9 @@ void qcms_transform_data_rgba_out_lut_sse1(qcms_transform *transform,
    315          src += 4;
    316  
    317          /* use calc'd indices to output RGB values */
    318 -        dest[0] = otdata_r[output[0]];
    319 -        dest[1] = otdata_g[output[1]];
    320 -        dest[2] = otdata_b[output[2]];
    321 +        dest[r_out] = otdata_r[output[0]];
    322 +        dest[1]     = otdata_g[output[1]];
    323 +        dest[b_out] = otdata_b[output[2]];
    324          dest += 4;
    325      }
    326  
    327 @@ -266,9 +272,9 @@ void qcms_transform_data_rgba_out_lut_sse1(qcms_transform *transform,
    328      result = _mm_movehl_ps(result, result);
    329      *((__m64 *)&output[2]) = _mm_cvtps_pi32(result);
    330  
    331 -    dest[0] = otdata_r[output[0]];
    332 -    dest[1] = otdata_g[output[1]];
    333 -    dest[2] = otdata_b[output[2]];
    334 +    dest[r_out] = otdata_r[output[0]];
    335 +    dest[1]     = otdata_g[output[1]];
    336 +    dest[b_out] = otdata_b[output[2]];
    337  
    338      _mm_empty();
    339  }
    340 diff --git a/third_party/qcms/src/transform-sse2.c b/third_party/qcms/src/transform-sse2.c
    341 index 6a5faf9..fa7f2d1 100644
    342 --- a/third_party/qcms/src/transform-sse2.c
    343 +++ b/third_party/qcms/src/transform-sse2.c
    344 @@ -34,7 +34,8 @@ static const ALIGN float clampMaxValueX4[4] =
    345  void qcms_transform_data_rgb_out_lut_sse2(qcms_transform *transform,
    346                                            unsigned char *src,
    347                                            unsigned char *dest,
    348 -                                          size_t length)
    349 +                                          size_t length,
    350 +                                          qcms_format_type output_format)
    351  {
    352      unsigned int i;
    353      float (*mat)[4] = transform->matrix;
    354 @@ -70,6 +71,8 @@ void qcms_transform_data_rgb_out_lut_sse2(qcms_transform *transform,
    355  
    356      /* working variables */
    357      __m128 vec_r, vec_g, vec_b, result;
    358 +    const int r_out = output_format.r;
    359 +    const int b_out = output_format.b;
    360  
    361      /* CYA */
    362      if (!length)
    363 @@ -114,9 +117,9 @@ void qcms_transform_data_rgb_out_lut_sse2(qcms_transform *transform,
    364          src += 3;
    365  
    366          /* use calc'd indices to output RGB values */
    367 -        dest[0] = otdata_r[output[0]];
    368 -        dest[1] = otdata_g[output[1]];
    369 -        dest[2] = otdata_b[output[2]];
    370 +        dest[r_out] = otdata_r[output[0]];
    371 +        dest[1]     = otdata_g[output[1]];
    372 +        dest[b_out] = otdata_b[output[2]];
    373          dest += 3;
    374      }
    375  
    376 @@ -137,15 +140,16 @@ void qcms_transform_data_rgb_out_lut_sse2(qcms_transform *transform,
    377  
    378      _mm_store_si128((__m128i*)output, _mm_cvtps_epi32(result));
    379  
    380 -    dest[0] = otdata_r[output[0]];
    381 -    dest[1] = otdata_g[output[1]];
    382 -    dest[2] = otdata_b[output[2]];
    383 +    dest[r_out] = otdata_r[output[0]];
    384 +    dest[1]     = otdata_g[output[1]];
    385 +    dest[b_out] = otdata_b[output[2]];
    386  }
    387  
    388  void qcms_transform_data_rgba_out_lut_sse2(qcms_transform *transform,
    389                                             unsigned char *src,
    390                                             unsigned char *dest,
    391 -                                           size_t length)
    392 +                                           size_t length,
    393 +                                           qcms_format_type output_format)
    394  {
    395      unsigned int i;
    396      float (*mat)[4] = transform->matrix;
    397 @@ -181,6 +185,8 @@ void qcms_transform_data_rgba_out_lut_sse2(qcms_transform *transform,
    398  
    399      /* working variables */
    400      __m128 vec_r, vec_g, vec_b, result;
    401 +    const int r_out = output_format.r;
    402 +    const int b_out = output_format.b;
    403      unsigned char alpha;
    404  
    405      /* CYA */
    406 @@ -231,9 +237,9 @@ void qcms_transform_data_rgba_out_lut_sse2(qcms_transform *transform,
    407          src += 4;
    408  
    409          /* use calc'd indices to output RGB values */
    410 -        dest[0] = otdata_r[output[0]];
    411 -        dest[1] = otdata_g[output[1]];
    412 -        dest[2] = otdata_b[output[2]];
    413 +        dest[r_out] = otdata_r[output[0]];
    414 +        dest[1]     = otdata_g[output[1]];
    415 +        dest[b_out] = otdata_b[output[2]];
    416          dest += 4;
    417      }
    418  
    419 @@ -256,7 +262,7 @@ void qcms_transform_data_rgba_out_lut_sse2(qcms_transform *transform,
    420  
    421      _mm_store_si128((__m128i*)output, _mm_cvtps_epi32(result));
    422  
    423 -    dest[0] = otdata_r[output[0]];
    424 -    dest[1] = otdata_g[output[1]];
    425 -    dest[2] = otdata_b[output[2]];
    426 +    dest[r_out] = otdata_r[output[0]];
    427 +    dest[1]     = otdata_g[output[1]];
    428 +    dest[b_out] = otdata_b[output[2]];
    429  }
    430 diff --git a/third_party/qcms/src/transform.c b/third_party/qcms/src/transform.c
    431 index 9a6562b..7e0ba2c 100644
    432 --- a/third_party/qcms/src/transform.c
    433 +++ b/third_party/qcms/src/transform.c
    434 @@ -181,11 +181,20 @@ compute_chromatic_adaption(struct CIE_XYZ source_white_point,
    435  static struct matrix
    436  adaption_matrix(struct CIE_XYZ source_illumination, struct CIE_XYZ target_illumination)
    437  {
    438 +#if defined (_MSC_VER)
    439 +#pragma warning(push)
    440 +/* Disable double to float truncation warning 4305 */
    441 +#pragma warning(disable:4305)
    442 +#endif
    443  	struct matrix lam_rigg = {{ // Bradford matrix
    444  	                         {  0.8951,  0.2664, -0.1614 },
    445  	                         { -0.7502,  1.7135,  0.0367 },
    446  	                         {  0.0389, -0.0685,  1.0296 }
    447  	                         }};
    448 +#if defined (_MSC_VER)
    449 +/* Restore warnings */
    450 +#pragma warning(pop)
    451 +#endif
    452  	return compute_chromatic_adaption(source_illumination, target_illumination, lam_rigg);
    453  }
    454  
    455 @@ -230,8 +239,11 @@ qcms_bool set_rgb_colorants(qcms_profile *profile, qcms_CIE_xyY white_point, qcm
    456  }
    457  
    458  #if 0
    459 -static void qcms_transform_data_rgb_out_pow(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    460 +static void qcms_transform_data_rgb_out_pow(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    461  {
    462 +	const int r_out = output_format.r;
    463 +	const int b_out = output_format.b;
    464 +
    465  	int i;
    466  	float (*mat)[4] = transform->matrix;
    467  	for (i=0; i<length; i++) {
    468 @@ -251,15 +263,19 @@ static void qcms_transform_data_rgb_out_pow(qcms_transform *transform, unsigned
    469  		float out_device_g = pow(out_linear_g, transform->out_gamma_g);
    470  		float out_device_b = pow(out_linear_b, transform->out_gamma_b);
    471  
    472 -		*dest++ = clamp_u8(255*out_device_r);
    473 -		*dest++ = clamp_u8(255*out_device_g);
    474 -		*dest++ = clamp_u8(255*out_device_b);
    475 +		dest[r_out] = clamp_u8(out_device_r*255);
    476 +		dest[1]     = clamp_u8(out_device_g*255);
    477 +		dest[b_out] = clamp_u8(out_device_b*255);
    478 +		dest += 3;
    479  	}
    480  }
    481  #endif
    482  
    483 -static void qcms_transform_data_gray_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    484 +static void qcms_transform_data_gray_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    485  {
    486 +	const int r_out = output_format.r;
    487 +	const int b_out = output_format.b;
    488 +
    489  	unsigned int i;
    490  	for (i = 0; i < length; i++) {
    491  		float out_device_r, out_device_g, out_device_b;
    492 @@ -267,13 +283,14 @@ static void qcms_transform_data_gray_out_lut(qcms_transform *transform, unsigned
    493  
    494  		float linear = transform->input_gamma_table_gray[device];
    495  
    496 -                out_device_r = lut_interp_linear(linear, transform->output_gamma_lut_r, transform->output_gamma_lut_r_length);
    497 +		out_device_r = lut_interp_linear(linear, transform->output_gamma_lut_r, transform->output_gamma_lut_r_length);
    498  		out_device_g = lut_interp_linear(linear, transform->output_gamma_lut_g, transform->output_gamma_lut_g_length);
    499  		out_device_b = lut_interp_linear(linear, transform->output_gamma_lut_b, transform->output_gamma_lut_b_length);
    500  
    501 -		*dest++ = clamp_u8(out_device_r*255);
    502 -		*dest++ = clamp_u8(out_device_g*255);
    503 -		*dest++ = clamp_u8(out_device_b*255);
    504 +		dest[r_out] = clamp_u8(out_device_r*255);
    505 +		dest[1]     = clamp_u8(out_device_g*255);
    506 +		dest[b_out] = clamp_u8(out_device_b*255);
    507 +		dest += 3;
    508  	}
    509  }
    510  
    511 @@ -283,8 +300,11 @@ static void qcms_transform_data_gray_out_lut(qcms_transform *transform, unsigned
    512  	See: ftp://ftp.alvyray.com/Acrobat/17_Nonln.pdf
    513  */
    514  
    515 -static void qcms_transform_data_graya_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    516 +static void qcms_transform_data_graya_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    517  {
    518 +	const int r_out = output_format.r;
    519 +	const int b_out = output_format.b;
    520 +
    521  	unsigned int i;
    522  	for (i = 0; i < length; i++) {
    523  		float out_device_r, out_device_g, out_device_b;
    524 @@ -293,20 +313,24 @@ static void qcms_transform_data_graya_out_lut(qcms_transform *transform, unsigne
    525  
    526  		float linear = transform->input_gamma_table_gray[device];
    527  
    528 -                out_device_r = lut_interp_linear(linear, transform->output_gamma_lut_r, transform->output_gamma_lut_r_length);
    529 +		out_device_r = lut_interp_linear(linear, transform->output_gamma_lut_r, transform->output_gamma_lut_r_length);
    530  		out_device_g = lut_interp_linear(linear, transform->output_gamma_lut_g, transform->output_gamma_lut_g_length);
    531  		out_device_b = lut_interp_linear(linear, transform->output_gamma_lut_b, transform->output_gamma_lut_b_length);
    532  
    533 -		*dest++ = clamp_u8(out_device_r*255);
    534 -		*dest++ = clamp_u8(out_device_g*255);
    535 -		*dest++ = clamp_u8(out_device_b*255);
    536 -		*dest++ = alpha;
    537 +		dest[r_out] = clamp_u8(out_device_r*255);
    538 +		dest[1]     = clamp_u8(out_device_g*255);
    539 +		dest[b_out] = clamp_u8(out_device_b*255);
    540 +		dest[3]     = alpha;
    541 +		dest += 4;
    542  	}
    543  }
    544  
    545  
    546 -static void qcms_transform_data_gray_out_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    547 +static void qcms_transform_data_gray_out_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    548  {
    549 +	const int r_out = output_format.r;
    550 +	const int b_out = output_format.b;
    551 +
    552  	unsigned int i;
    553  	for (i = 0; i < length; i++) {
    554  		unsigned char device = *src++;
    555 @@ -317,14 +341,19 @@ static void qcms_transform_data_gray_out_precache(qcms_transform *transform, uns
    556  		/* we could round here... */
    557  		gray = linear * PRECACHE_OUTPUT_MAX;
    558  
    559 -		*dest++ = transform->output_table_r->data[gray];
    560 -		*dest++ = transform->output_table_g->data[gray];
    561 -		*dest++ = transform->output_table_b->data[gray];
    562 +		dest[r_out] = transform->output_table_r->data[gray];
    563 +		dest[1]     = transform->output_table_g->data[gray];
    564 +		dest[b_out] = transform->output_table_b->data[gray];
    565 +		dest += 3;
    566  	}
    567  }
    568  
    569 -static void qcms_transform_data_graya_out_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    570 +
    571 +static void qcms_transform_data_graya_out_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    572  {
    573 +	const int r_out = output_format.r;
    574 +	const int b_out = output_format.b;
    575 +
    576  	unsigned int i;
    577  	for (i = 0; i < length; i++) {
    578  		unsigned char device = *src++;
    579 @@ -336,15 +365,19 @@ static void qcms_transform_data_graya_out_precache(qcms_transform *transform, un
    580  		/* we could round here... */
    581  		gray = linear * PRECACHE_OUTPUT_MAX;
    582  
    583 -		*dest++ = transform->output_table_r->data[gray];
    584 -		*dest++ = transform->output_table_g->data[gray];
    585 -		*dest++ = transform->output_table_b->data[gray];
    586 -		*dest++ = alpha;
    587 +		dest[r_out] = transform->output_table_r->data[gray];
    588 +		dest[1]     = transform->output_table_g->data[gray];
    589 +		dest[b_out] = transform->output_table_b->data[gray];
    590 +		dest[3]     = alpha;
    591 +		dest += 4;
    592  	}
    593  }
    594  
    595 -static void qcms_transform_data_rgb_out_lut_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    596 +static void qcms_transform_data_rgb_out_lut_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    597  {
    598 +	const int r_out = output_format.r;
    599 +	const int b_out = output_format.b;
    600 +
    601  	unsigned int i;
    602  	float (*mat)[4] = transform->matrix;
    603  	for (i = 0; i < length; i++) {
    604 @@ -370,14 +403,18 @@ static void qcms_transform_data_rgb_out_lut_precache(qcms_transform *transform,
    605  		g = out_linear_g * PRECACHE_OUTPUT_MAX;
    606  		b = out_linear_b * PRECACHE_OUTPUT_MAX;
    607  
    608 -		*dest++ = transform->output_table_r->data[r];
    609 -		*dest++ = transform->output_table_g->data[g];
    610 -		*dest++ = transform->output_table_b->data[b];
    611 +		dest[r_out] = transform->output_table_r->data[r];
    612 +		dest[1]     = transform->output_table_g->data[g];
    613 +		dest[b_out] = transform->output_table_b->data[b];
    614 +		dest += 3;
    615  	}
    616  }
    617  
    618 -static void qcms_transform_data_rgba_out_lut_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    619 +static void qcms_transform_data_rgba_out_lut_precache(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    620  {
    621 +	const int r_out = output_format.r;
    622 +	const int b_out = output_format.b;
    623 +
    624  	unsigned int i;
    625  	float (*mat)[4] = transform->matrix;
    626  	for (i = 0; i < length; i++) {
    627 @@ -404,16 +441,21 @@ static void qcms_transform_data_rgba_out_lut_precache(qcms_transform *transform,
    628  		g = out_linear_g * PRECACHE_OUTPUT_MAX;
    629  		b = out_linear_b * PRECACHE_OUTPUT_MAX;
    630  
    631 -		*dest++ = transform->output_table_r->data[r];
    632 -		*dest++ = transform->output_table_g->data[g];
    633 -		*dest++ = transform->output_table_b->data[b];
    634 -		*dest++ = alpha;
    635 +		dest[r_out] = transform->output_table_r->data[r];
    636 +		dest[1]     = transform->output_table_g->data[g];
    637 +		dest[b_out] = transform->output_table_b->data[b];
    638 +		dest[3]     = alpha;
    639 +		dest += 4;
    640  	}
    641  }
    642  
    643  // Not used
    644  /* 
    645 -static void qcms_transform_data_clut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length) {
    646 +static void qcms_transform_data_clut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    647 +{
    648 +	const int r_out = output_format.r;
    649 +	const int b_out = output_format.b;
    650 +
    651  	unsigned int i;
    652  	int xy_len = 1;
    653  	int x_len = transform->grid_size;
    654 @@ -462,15 +504,20 @@ static void qcms_transform_data_clut(qcms_transform *transform, unsigned char *s
    655  		float b_y2 = lerp(b_x3, b_x4, y_d);
    656  		float clut_b = lerp(b_y1, b_y2, z_d);
    657  
    658 -		*dest++ = clamp_u8(clut_r*255.0f);
    659 -		*dest++ = clamp_u8(clut_g*255.0f);
    660 -		*dest++ = clamp_u8(clut_b*255.0f);
    661 -	}	
    662 +		dest[r_out] = clamp_u8(clut_r*255.0f);
    663 +		dest[1]     = clamp_u8(clut_g*255.0f);
    664 +		dest[b_out] = clamp_u8(clut_b*255.0f);
    665 +		dest += 3;
    666 +	}
    667  }
    668  */
    669  
    670  // Using lcms' tetra interpolation algorithm.
    671 -static void qcms_transform_data_tetra_clut_rgba(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length) {
    672 +static void qcms_transform_data_tetra_clut_rgba(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    673 +{
    674 +	const int r_out = output_format.r;
    675 +	const int b_out = output_format.b;
    676 +
    677  	unsigned int i;
    678  	int xy_len = 1;
    679  	int x_len = transform->grid_size;
    680 @@ -577,15 +624,20 @@ static void qcms_transform_data_tetra_clut_rgba(qcms_transform *transform, unsig
    681  		clut_g = c0_g + c1_g*rx + c2_g*ry + c3_g*rz;
    682  		clut_b = c0_b + c1_b*rx + c2_b*ry + c3_b*rz;
    683  
    684 -		*dest++ = clamp_u8(clut_r*255.0f);
    685 -		*dest++ = clamp_u8(clut_g*255.0f);
    686 -		*dest++ = clamp_u8(clut_b*255.0f);
    687 -		*dest++ = in_a;
    688 -	}	
    689 +		dest[r_out] = clamp_u8(clut_r*255.0f);
    690 +		dest[1]     = clamp_u8(clut_g*255.0f);
    691 +		dest[b_out] = clamp_u8(clut_b*255.0f);
    692 +		dest[3]     = in_a;
    693 +		dest += 4;
    694 +	}
    695  }
    696  
    697  // Using lcms' tetra interpolation code.
    698 -static void qcms_transform_data_tetra_clut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length) {
    699 +static void qcms_transform_data_tetra_clut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    700 +{
    701 +	const int r_out = output_format.r;
    702 +	const int b_out = output_format.b;
    703 +
    704  	unsigned int i;
    705  	int xy_len = 1;
    706  	int x_len = transform->grid_size;
    707 @@ -691,14 +743,18 @@ static void qcms_transform_data_tetra_clut(qcms_transform *transform, unsigned c
    708  		clut_g = c0_g + c1_g*rx + c2_g*ry + c3_g*rz;
    709  		clut_b = c0_b + c1_b*rx + c2_b*ry + c3_b*rz;
    710  
    711 -		*dest++ = clamp_u8(clut_r*255.0f);
    712 -		*dest++ = clamp_u8(clut_g*255.0f);
    713 -		*dest++ = clamp_u8(clut_b*255.0f);
    714 -	}	
    715 +		dest[r_out] = clamp_u8(clut_r*255.0f);
    716 +		dest[1]     = clamp_u8(clut_g*255.0f);
    717 +		dest[b_out] = clamp_u8(clut_b*255.0f);
    718 +		dest += 3;
    719 +	}
    720  }
    721  
    722 -static void qcms_transform_data_rgb_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    723 +static void qcms_transform_data_rgb_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    724  {
    725 +	const int r_out = output_format.r;
    726 +	const int b_out = output_format.b;
    727 +
    728  	unsigned int i;
    729  	float (*mat)[4] = transform->matrix;
    730  	for (i = 0; i < length; i++) {
    731 @@ -726,14 +782,18 @@ static void qcms_transform_data_rgb_out_lut(qcms_transform *transform, unsigned
    732  		out_device_b = lut_interp_linear(out_linear_b, 
    733  				transform->output_gamma_lut_b, transform->output_gamma_lut_b_length);
    734  
    735 -		*dest++ = clamp_u8(out_device_r*255);
    736 -		*dest++ = clamp_u8(out_device_g*255);
    737 -		*dest++ = clamp_u8(out_device_b*255);
    738 +		dest[r_out] = clamp_u8(out_device_r*255);
    739 +		dest[1]     = clamp_u8(out_device_g*255);
    740 +		dest[b_out] = clamp_u8(out_device_b*255);
    741 +		dest += 3;
    742  	}
    743  }
    744  
    745 -static void qcms_transform_data_rgba_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    746 +static void qcms_transform_data_rgba_out_lut(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    747  {
    748 +	const int r_out = output_format.r;
    749 +	const int b_out = output_format.b;
    750 +
    751  	unsigned int i;
    752  	float (*mat)[4] = transform->matrix;
    753  	for (i = 0; i < length; i++) {
    754 @@ -762,16 +822,20 @@ static void qcms_transform_data_rgba_out_lut(qcms_transform *transform, unsigned
    755  		out_device_b = lut_interp_linear(out_linear_b, 
    756  				transform->output_gamma_lut_b, transform->output_gamma_lut_b_length);
    757  
    758 -		*dest++ = clamp_u8(out_device_r*255);
    759 -		*dest++ = clamp_u8(out_device_g*255);
    760 -		*dest++ = clamp_u8(out_device_b*255);
    761 -		*dest++ = alpha;
    762 +		dest[r_out] = clamp_u8(out_device_r*255);
    763 +		dest[1]     = clamp_u8(out_device_g*255);
    764 +		dest[b_out] = clamp_u8(out_device_b*255);
    765 +		dest[3]     = alpha;
    766 +		dest += 4;
    767  	}
    768  }
    769  
    770  #if 0
    771 -static void qcms_transform_data_rgb_out_linear(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length)
    772 +static void qcms_transform_data_rgb_out_linear(qcms_transform *transform, unsigned char *src, unsigned char *dest, size_t length, qcms_format_type output_format)
    773  {
    774 +	const int r_out = output_format.r;
    775 +	const int b_out = output_format.b;
    776 +
    777  	int i;
    778  	float (*mat)[4] = transform->matrix;
    779  	for (i = 0; i < length; i++) {
    780 @@ -787,16 +851,25 @@ static void qcms_transform_data_rgb_out_linear(qcms_transform *transform, unsign
    781  		float out_linear_g = mat[0][1]*linear_r + mat[1][1]*linear_g + mat[2][1]*linear_b;
    782  		float out_linear_b = mat[0][2]*linear_r + mat[1][2]*linear_g + mat[2][2]*linear_b;
    783  
    784 -		*dest++ = clamp_u8(out_linear_r*255);
    785 -		*dest++ = clamp_u8(out_linear_g*255);
    786 -		*dest++ = clamp_u8(out_linear_b*255);
    787 +		dest[r_out] = clamp_u8(out_linear_r*255);
    788 +		dest[1]     = clamp_u8(out_linear_g*255);
    789 +		dest[b_out] = clamp_u8(out_linear_b*255);
    790 +		dest += 3;
    791  	}
    792  }
    793  #endif
    794  
    795 +/*
    796 + * If users create and destroy objects on different threads, even if the same
    797 + * objects aren't used on different threads at the same time, we can still run
    798 + * in to trouble with refcounts if they aren't atomic.
    799 + *
    800 + * This can lead to us prematurely deleting the precache if threads get unlucky
    801 + * and write the wrong value to the ref count.
    802 + */
    803  static struct precache_output *precache_reference(struct precache_output *p)
    804  {
    805 -	p->ref_count++;
    806 +	qcms_atomic_increment(p->ref_count);
    807  	return p;
    808  }
    809  
    810 @@ -810,12 +883,12 @@ static struct precache_output *precache_create()
    811  
    812  void precache_release(struct precache_output *p)
    813  {
    814 -	if (--p->ref_count == 0) {
    815 +	if (qcms_atomic_decrement(p->ref_count) == 0) {
    816  		free(p);
    817  	}
    818  }
    819  
    820 -#ifdef HAS_POSIX_MEMALIGN
    821 +#ifdef HAVE_POSIX_MEMALIGN
    822  static qcms_transform *transform_alloc(void)
    823  {
    824  	qcms_transform *t;
    825 @@ -994,13 +1067,15 @@ void qcms_profile_precache_output_transform(qcms_profile *profile)
    826  	if (profile->color_space != RGB_SIGNATURE)
    827  		return;
    828  
    829 -	/* don't precache since we will use the B2A LUT */
    830 -	if (profile->B2A0)
    831 -		return;
    832 +	if (qcms_supports_iccv4) {
    833 +		/* don't precache since we will use the B2A LUT */
    834 +		if (profile->B2A0)
    835 +			return;
    836  
    837 -	/* don't precache since we will use the mBA LUT */
    838 -	if (profile->mBA)
    839 -		return;
    840 +		/* don't precache since we will use the mBA LUT */
    841 +		if (profile->mBA)
    842 +			return;
    843 +	}
    844  
    845  	/* don't precache if we do not have the TRC curves */
    846  	if (!profile->redTRC || !profile->greenTRC || !profile->blueTRC)
    847 @@ -1157,14 +1232,14 @@ qcms_transform* qcms_transform_create(
    848                  	return NULL;
    849              	}
    850  		if (precache) {
    851 -#ifdef X86
    852 +#if defined(SSE2_ENABLE) && defined(X86)
    853  		    if (sse_version_available() >= 2) {
    854  			    if (in_type == QCMS_DATA_RGB_8)
    855  				    transform->transform_fn = qcms_transform_data_rgb_out_lut_sse2;
    856  			    else
    857  				    transform->transform_fn = qcms_transform_data_rgba_out_lut_sse2;
    858  
    859 -#if !(defined(_MSC_VER) && defined(_M_AMD64))
    860 +#if defined(SSE2_ENABLE) && !(defined(_MSC_VER) && defined(_M_AMD64))
    861                      /* Microsoft Compiler for x64 doesn't support MMX.
    862                       * SSE code uses MMX so that we disable on x64 */
    863  		    } else
    864 @@ -1256,13 +1331,34 @@ qcms_transform* qcms_transform_create(
    865  	return transform;
    866  }
    867  
    868 -#if defined(__GNUC__) && !defined(__x86_64__) && !defined(__amd64__)
    869 +/* __force_align_arg_pointer__ is an x86-only attribute, and gcc/clang warns on unused
    870 + * attributes. Don't use this on ARM or AMD64. __has_attribute can detect the presence
    871 + * of the attribute but is currently only supported by clang */
    872 +#if defined(__has_attribute)
    873 +#define HAS_FORCE_ALIGN_ARG_POINTER __has_attribute(__force_align_arg_pointer__)
    874 +#elif defined(__GNUC__) && !defined(__x86_64__) && !defined(__amd64__) && !defined(__arm__) && !defined(__mips__)
    875 +#define HAS_FORCE_ALIGN_ARG_POINTER 1
    876 +#else
    877 +#define HAS_FORCE_ALIGN_ARG_POINTER 0
    878 +#endif
    879 +
    880 +#if HAS_FORCE_ALIGN_ARG_POINTER
    881  /* we need this to avoid crashes when gcc assumes the stack is 128bit aligned */
    882  __attribute__((__force_align_arg_pointer__))
    883  #endif
    884  void qcms_transform_data(qcms_transform *transform, void *src, void *dest, size_t length)
    885  {
    886 -	transform->transform_fn(transform, src, dest, length);
    887 +	static const struct _qcms_format_type output_rgbx = { 0, 2 };
    888 +
    889 +	transform->transform_fn(transform, src, dest, length, output_rgbx);
    890 +}
    891 +
    892 +void qcms_transform_data_type(qcms_transform *transform, void *src, void *dest, size_t length, qcms_output_type type)
    893 +{
    894 +	static const struct _qcms_format_type output_rgbx = { 0, 2 };
    895 +	static const struct _qcms_format_type output_bgrx = { 2, 0 };
    896 +
    897 +	transform->transform_fn(transform, src, dest, length, type == QCMS_OUTPUT_BGRX ? output_bgrx : output_rgbx);
    898  }
    899  
    900  qcms_bool qcms_supports_iccv4;
    901 diff --git a/third_party/qcms/src/transform_util.c b/third_party/qcms/src/transform_util.c
    902 index e8447e5..f4338b2 100644
    903 --- a/third_party/qcms/src/transform_util.c
    904 +++ b/third_party/qcms/src/transform_util.c
    905 @@ -36,7 +36,7 @@
    906  
    907  /* value must be a value between 0 and 1 */
    908  //XXX: is the above a good restriction to have?
    909 -float lut_interp_linear(double value, uint16_t *table, int length)
    910 +float lut_interp_linear(double value, uint16_t *table, size_t length)
    911  {
    912  	int upper, lower;
    913  	value = value * (length - 1); // scale to length of the array
    914 @@ -49,11 +49,11 @@ float lut_interp_linear(double value, uint16_t *table, int length)
    915  }
    916  
    917  /* same as above but takes and returns a uint16_t value representing a range from 0..1 */
    918 -uint16_t lut_interp_linear16(uint16_t input_value, uint16_t *table, int length)
    919 +uint16_t lut_interp_linear16(uint16_t input_value, uint16_t *table, size_t length)
    920  {
    921  	/* Start scaling input_value to the length of the array: 65535*(length-1).
    922  	 * We'll divide out the 65535 next */
    923 -	uint32_t value = (input_value * (length - 1));
    924 +	uintptr_t value = (input_value * (length - 1));
    925  	uint32_t upper = (value + 65534) / 65535; /* equivalent to ceil(value/65535) */
    926  	uint32_t lower = value / 65535;           /* equivalent to floor(value/65535) */
    927  	/* interp is the distance from upper to value scaled to 0..65535 */
    928 @@ -67,11 +67,11 @@ uint16_t lut_interp_linear16(uint16_t input_value, uint16_t *table, int length)
    929  /* same as above but takes an input_value from 0..PRECACHE_OUTPUT_MAX
    930   * and returns a uint8_t value representing a range from 0..1 */
    931  static
    932 -uint8_t lut_interp_linear_precache_output(uint32_t input_value, uint16_t *table, int length)
    933 +uint8_t lut_interp_linear_precache_output(uint32_t input_value, uint16_t *table, size_t length)
    934  {
    935  	/* Start scaling input_value to the length of the array: PRECACHE_OUTPUT_MAX*(length-1).
    936  	 * We'll divide out the PRECACHE_OUTPUT_MAX next */
    937 -	uint32_t value = (input_value * (length - 1));
    938 +	uintptr_t value = (input_value * (length - 1));
    939  
    940  	/* equivalent to ceil(value/PRECACHE_OUTPUT_MAX) */
    941  	uint32_t upper = (value + PRECACHE_OUTPUT_MAX-1) / PRECACHE_OUTPUT_MAX;
    942 @@ -91,7 +91,7 @@ uint8_t lut_interp_linear_precache_output(uint32_t input_value, uint16_t *table,
    943  
    944  /* value must be a value between 0 and 1 */
    945  //XXX: is the above a good restriction to have?
    946 -float lut_interp_linear_float(float value, float *table, int length)
    947 +float lut_interp_linear_float(float value, float *table, size_t length)
    948  {
    949          int upper, lower;
    950          value = value * (length - 1);
    951 @@ -235,6 +235,21 @@ float u8Fixed8Number_to_float(uint16_t x)
    952  	return x/256.;
    953  }
    954  
    955 +/* The SSE2 code uses min & max which let NaNs pass through.
    956 +   We want to try to prevent that here by ensuring that
    957 +   gamma table is within expected values. */
    958 +void validate_gamma_table(float gamma_table[256])
    959 +{
    960 +	int i;
    961 +	for (i = 0; i < 256; i++) {
    962 +		// Note: we check that the gamma is not in range
    963 +		// instead of out of range so that we catch NaNs
    964 +		if (!(gamma_table[i] >= 0.f && gamma_table[i] <= 1.f)) {
    965 +			gamma_table[i] = 0.f;
    966 +		}
    967 +	}
    968 +}
    969 +
    970  float *build_input_gamma_table(struct curveType *TRC)
    971  {
    972  	float *gamma_table;
    973 @@ -254,7 +269,10 @@ float *build_input_gamma_table(struct curveType *TRC)
    974  			}
    975  		}
    976  	}
    977 -        return gamma_table;
    978 +
    979 +	validate_gamma_table(gamma_table);
    980 +
    981 +	return gamma_table;
    982  }
    983  
    984  struct matrix build_colorant_matrix(qcms_profile *p)
    985 @@ -390,7 +408,7 @@ uint16_fract_t lut_inverse_interp16(uint16_t Value, uint16_t LutTable[], int len
    986   which has an maximum error of about 9855 (pixel difference of ~38.346)
    987  
    988   For now, we punt the decision of output size to the caller. */
    989 -static uint16_t *invert_lut(uint16_t *table, int length, int out_length)
    990 +static uint16_t *invert_lut(uint16_t *table, int length, size_t out_length)
    991  {
    992          int i;
    993          /* for now we invert the lut by creating a lut of size out_length
    994 diff --git a/third_party/qcms/src/transform_util.h b/third_party/qcms/src/transform_util.h
    995 index 8f358a8..de465f4 100644
    996 --- a/third_party/qcms/src/transform_util.h
    997 +++ b/third_party/qcms/src/transform_util.h
    998 @@ -31,9 +31,9 @@
    999  //XXX: could use a bettername
   1000  typedef uint16_t uint16_fract_t;
   1001  
   1002 -float lut_interp_linear(double value, uint16_t *table, int length);
   1003 -float lut_interp_linear_float(float value, float *table, int length);
   1004 -uint16_t lut_interp_linear16(uint16_t input_value, uint16_t *table, int length);
   1005 +float lut_interp_linear(double value, uint16_t *table, size_t length);
   1006 +float lut_interp_linear_float(float value, float *table, size_t length);
   1007 +uint16_t lut_interp_linear16(uint16_t input_value, uint16_t *table, size_t length);
   1008  
   1009  
   1010  static inline float lerp(float a, float b, float t)
   1011