Chromium Code Reviews| Index: gm/rebaseline_server/imagediffdb.py |
| =================================================================== |
| --- gm/rebaseline_server/imagediffdb.py (revision 12361) |
| +++ gm/rebaseline_server/imagediffdb.py (working copy) |
| @@ -21,14 +21,14 @@ |
| + 'http://www.pythonware.com/products/pil/') |
| IMAGE_SUFFIX = '.png' |
| -IMAGE_FORMAT = 'PNG' # must match one of the PIL image formats, listed at |
| - # http://effbot.org/imagingbook/formats.htm |
| IMAGES_SUBDIR = 'images' |
| DIFFS_SUBDIR = 'diffs' |
| WHITEDIFFS_SUBDIR = 'whitediffs' |
| +VALUES_PER_BAND = 256 |
| + |
| class DiffRecord(object): |
| """ Record of differences between two images. """ |
| @@ -65,33 +65,43 @@ |
| str(actual_image_locator) + IMAGE_SUFFIX), |
| actual_image_url) |
| - # Store the diff image (absolute diff at each pixel). |
| + # Generate the diff image (absolute diff at each pixel) and |
| + # max_diff_per_channel. |
| diff_image = _generate_image_diff(actual_image, expected_image) |
| - self._weighted_diff_measure = _calculate_weighted_diff_metric(diff_image) |
| + diff_histogram = diff_image.histogram() |
| + (diff_width, diff_height) = diff_image.size |
| + self._weighted_diff_measure = _calculate_weighted_diff_metric( |
| + diff_histogram, diff_width * diff_height) |
| + self._max_diff_per_channel = _max_per_band(diff_histogram) |
| + |
| + # Generate the whitediff image (any differing pixels show as white). |
| + # This is tricky, because when you convert color images to grayscale or |
| + # black & white in PIL, it has its own ideas about thresholds. |
| + # We have to force it: if a pixel has any color at all, it's a '1'. |
| + bands = diff_image.split() |
| + graydiff_image = ImageChops.lighter(ImageChops.lighter( |
| + bands[0], bands[1]), bands[2]) |
| + whitediff_image = (graydiff_image.point(lambda p: p > 0 and VALUES_PER_BAND) |
| + .convert('1', dither=Image.NONE)) |
| + |
| + # Final touches on diff_image: use whitediff_image as an alpha mask. |
| + # Unchanged pixels are transparent; differing pixels are opaque. |
| + diff_image.putalpha(whitediff_image) |
| + |
| + # Store the diff and whitediff images generated above. |
| diff_image_locator = _get_difference_locator( |
| expected_image_locator=expected_image_locator, |
| actual_image_locator=actual_image_locator) |
| - diff_image_filepath = os.path.join( |
| - storage_root, DIFFS_SUBDIR, str(diff_image_locator) + IMAGE_SUFFIX) |
| - _mkdir_unless_exists(os.path.join(storage_root, DIFFS_SUBDIR)) |
| - diff_image.save(diff_image_filepath, IMAGE_FORMAT) |
| + basename = str(diff_image_locator) + IMAGE_SUFFIX |
| + _save_image(diff_image, os.path.join( |
| + storage_root, DIFFS_SUBDIR, basename)) |
| + _save_image(whitediff_image, os.path.join( |
| + storage_root, WHITEDIFFS_SUBDIR, basename)) |
| - # Store the whitediff image (any differing pixels show as white). |
| - # |
| - # TODO(epoger): From http://effbot.org/imagingbook/image.htm , it seems |
| - # like we should be able to use im.point(function, mode) to perform both |
| - # the point() and convert('1') operations simultaneously, but I couldn't |
| - # get it to work. |
| - whitediff_image = (diff_image.point(lambda p: (0, 256)[p!=0]) |
| - .convert('1')) |
| - whitediff_image_filepath = os.path.join( |
| - storage_root, WHITEDIFFS_SUBDIR, str(diff_image_locator) + IMAGE_SUFFIX) |
| - _mkdir_unless_exists(os.path.join(storage_root, WHITEDIFFS_SUBDIR)) |
| - whitediff_image.save(whitediff_image_filepath, IMAGE_FORMAT) |
| - |
| # Calculate difference metrics. |
| (self._width, self._height) = diff_image.size |
| - self._num_pixels_differing = whitediff_image.histogram()[255] |
| + self._num_pixels_differing = ( |
| + whitediff_image.histogram()[VALUES_PER_BAND - 1]) |
| def get_num_pixels_differing(self): |
| """Returns the absolute number of pixels that differ.""" |
| @@ -108,7 +118,12 @@ |
| (inclusive).""" |
| return self._weighted_diff_measure |
| + def get_max_diff_per_channel(self): |
| + """Returns the maximum difference between the expected and actual images |
| + for each R/G/B channel, as a list.""" |
| + return self._max_diff_per_channel |
| + |
| class ImageDiffDB(object): |
| """ Calculates differences between image pairs, maintaining a database of |
| them for download.""" |
| @@ -175,27 +190,53 @@ |
| # Utility functions |
| -def _calculate_weighted_diff_metric(image): |
| - """Given a diff image (per-channel diff at each pixel between two images), |
| - calculate the weighted diff metric (a stab at how different the two images |
| - really are). |
| +def _calculate_weighted_diff_metric(histogram, num_pixels): |
| + """Given the histogram of a diff image (per-channel diff at each |
| + pixel between two images), calculate the weighted diff metric (a |
| + stab at how different the two images really are). |
| Args: |
| - image: PIL image; a per-channel diff between two images |
| + histogram: PIL histogram of a per-channel diff between two images |
| + num_pixels: integer; the total number of pixels in the diff image |
| Returns: a weighted diff metric, as a float between 0 and 100 (inclusive). |
| """ |
| # TODO(epoger): This is just a wild guess at an appropriate metric. |
| # In the long term, we will probably use some metric generated by |
| # skpdiff anyway. |
| - (width, height) = image.size |
| - maxdiff = 3 * (width * height) * 255**2 |
| - h = image.histogram() |
| - assert(len(h) % 256 == 0) |
| - totaldiff = sum(map(lambda index,value: value * (index%256)**2, |
| - range(len(h)), h)) |
| - return float(100 * totaldiff) / maxdiff |
| + assert(len(histogram) % VALUES_PER_BAND == 0) |
| + num_bands = len(histogram) / VALUES_PER_BAND |
| + max_diff = num_pixels * num_bands * (VALUES_PER_BAND - 1)**2 |
| + total_diff = sum(map(lambda index,value: value * (index % VALUES_PER_BAND)**2, |
|
mtklein
2013/11/22 18:47:34
I think this expression may have tipped over into
epoger
2013/11/22 19:05:18
I completely agree. I was just trying to be one o
|
| + xrange(len(histogram)), histogram)) |
| + return float(100 * total_diff) / max_diff |
| +def _max_per_band(histogram): |
| + """Given the histogram of an image, return the maximum value of each band |
| + (a.k.a. "color channel", such as R/G/B) across the entire image. |
| + |
| + Args: |
| + histogram: PIL histogram |
| + |
| + Returns the maximum value of each band within the image histogram, as a list. |
| + """ |
| + max_per_band = [] |
| + assert(len(histogram) % VALUES_PER_BAND == 0) |
| + num_bands = len(histogram) / VALUES_PER_BAND |
| + for band in xrange(num_bands): |
| + # Assuming that VALUES_PER_BAND is 256... |
| + # the 'R' band makes up indices 0-255 in the histogram, |
| + # the 'G' band makes up indices 256-511 in the histogram, |
| + # etc. |
| + min_index = band * VALUES_PER_BAND |
| + index = min_index + VALUES_PER_BAND |
| + while index > min_index: |
| + index -= 1 |
| + if histogram[index] > 0: |
| + max_per_band.append(index - min_index) |
| + break |
| + return max_per_band |
| + |
| def _generate_image_diff(image1, image2): |
| """Wrapper for ImageChops.difference(image1, image2) that will handle some |
| errors automatically, or at least yield more useful error messages. |
| @@ -248,6 +289,18 @@ |
| logging.error('IOError loading image file %s' % filepath) |
| raise |
| +def _save_image(image, filepath, format='PNG'): |
| + """Write an image to disk, creating any intermediate directories as needed. |
| + |
| + Args: |
| + image: a PIL image object |
| + filepath: path on local disk to write image to |
| + format: one of the PIL image formats, listed at |
| + http://effbot.org/imagingbook/formats.htm |
| + """ |
| + _mkdir_unless_exists(os.path.dirname(filepath)) |
| + image.save(filepath, format) |
| + |
| def _mkdir_unless_exists(path): |
| """Unless path refers to an already-existing directory, create it. |