gm/rebaseline_server/imagediffdb.py - Issue 325413003: rebaseline_server: use just skpdiff, not Python Image Library

Unified Diff: gm/rebaseline_server/imagediffdb.py

Issue 325413003: rebaseline_server: use just skpdiff, not Python Image Library (Closed) Base URL: https://skia.googlesource.com/skia.git@master

Patch Set: attempt to fix "'abs' : ambiguous call to overloaded function" on Windows Created 6 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: gm/rebaseline_server/imagediffdb.py

diff --git a/gm/rebaseline_server/imagediffdb.py b/gm/rebaseline_server/imagediffdb.py

index 6b684143b03f256a6a4eee87d43447eabfe713f8..985017af1c28b862525957588df4e8482ca10541 100644

--- a/gm/rebaseline_server/imagediffdb.py

+++ b/gm/rebaseline_server/imagediffdb.py

@@ -10,7 +10,7 @@ Calulate differences between image pairs, and store them in a database.

"""

import contextlib

-import csv

+import json

import logging

import os

import re

@@ -18,11 +18,6 @@ import shutil

import sys

import tempfile

import urllib

-try:

- from PIL import Image, ImageChops

-except ImportError:

- raise ImportError('Requires PIL to be installed; see '

- + 'http://www.pythonware.com/products/pil/')

# Set the PYTHONPATH to include the tools directory.

sys.path.append(

@@ -38,11 +33,9 @@ DEFAULT_IMAGES_SUBDIR = 'images'

DISALLOWED_FILEPATH_CHAR_REGEX = re.compile('[^\w\-]')

-DIFFS_SUBDIR = 'diffs'

+RGBDIFFS_SUBDIR = 'diffs'

WHITEDIFFS_SUBDIR = 'whitediffs'

-VALUES_PER_BAND = 256

# Keys used within DiffRecord dictionary representations.

# NOTE: Keep these in sync with static/constants.js

KEY__DIFFERENCES__MAX_DIFF_PER_CHANNEL = 'maxDiffPerChannel'

@@ -87,9 +80,8 @@ class DiffRecord(object):

actual_image_locator = _sanitize_locator(actual_image_locator)

# Download the expected/actual images, if we don't have them already.

- # TODO(rmistry): Add a parameter that makes _download_and_open_image raise

- # an exception if images are not found locally (instead of trying to

- # download them).

+ # TODO(rmistry): Add a parameter that just tries to use already-present

+ # image files rather than downloading them.

expected_image_file = os.path.join(

storage_root, expected_images_subdir,

str(expected_image_locator) + image_suffix)

@@ -97,80 +89,91 @@ class DiffRecord(object):

storage_root, actual_images_subdir,

str(actual_image_locator) + image_suffix)

try:

- expected_image = _download_and_open_image(

- expected_image_file, expected_image_url)

+ _download_file(expected_image_file, expected_image_url)

except Exception:

logging.exception('unable to download expected_image_url %s to file %s' %

(expected_image_url, expected_image_file))

raise

try:

- actual_image = _download_and_open_image(

- actual_image_file, actual_image_url)

+ _download_file(actual_image_file, actual_image_url)

except Exception:

logging.exception('unable to download actual_image_url %s to file %s' %

(actual_image_url, actual_image_file))

raise

- # Generate the diff image (absolute diff at each pixel) and

- # max_diff_per_channel.

- diff_image = _generate_image_diff(actual_image, expected_image)

- diff_histogram = diff_image.histogram()

- (diff_width, diff_height) = diff_image.size

- self._max_diff_per_channel = _max_per_band(diff_histogram)

- # Generate the whitediff image (any differing pixels show as white).

- # This is tricky, because when you convert color images to grayscale or

- # black & white in PIL, it has its own ideas about thresholds.

- # We have to force it: if a pixel has any color at all, it's a '1'.

- bands = diff_image.split()

- graydiff_image = ImageChops.lighter(ImageChops.lighter(

- bands[0], bands[1]), bands[2])

- whitediff_image = (graydiff_image.point(lambda p: p > 0 and VALUES_PER_BAND)

- .convert('1', dither=Image.NONE))

- # Calculate the perceptual difference percentage.

- skpdiff_csv_dir = tempfile.mkdtemp()

+ # Get all diff images and values from skpdiff binary.

+ skpdiff_output_dir = tempfile.mkdtemp()

try:

- skpdiff_csv_output = os.path.join(skpdiff_csv_dir, 'skpdiff-output.csv')

+ skpdiff_summary_file = os.path.join(skpdiff_output_dir,

+ 'skpdiff-output.json')

+ skpdiff_rgbdiff_dir = os.path.join(skpdiff_output_dir, 'rgbDiff')

+ skpdiff_whitediff_dir = os.path.join(skpdiff_output_dir, 'whiteDiff')

expected_img = os.path.join(storage_root, expected_images_subdir,

str(expected_image_locator) + image_suffix)

actual_img = os.path.join(storage_root, actual_images_subdir,

str(actual_image_locator) + image_suffix)

+ # TODO: Call skpdiff ONCE for all image pairs, instead of calling it

+ # repeatedly. This will allow us to parallelize a lot more work.

find_run_binary.run_command(

[SKPDIFF_BINARY, '-p', expected_img, actual_img,

- '--csv', skpdiff_csv_output, '-d', 'perceptual'])

- with contextlib.closing(open(skpdiff_csv_output)) as csv_file:

- for row in csv.DictReader(csv_file):

- perceptual_similarity = float(row[' perceptual'].strip())

- if not 0 <= perceptual_similarity <= 1:

- # skpdiff outputs -1 if the images are different sizes. Treat any

- # output that does not lie in [0, 1] as having 0% perceptual

- # similarity.

- perceptual_similarity = 0

- # skpdiff returns the perceptual similarity, convert it to get the

- # perceptual difference percentage.

- self._perceptual_difference = 100 - (perceptual_similarity * 100)

+ '--jsonp', 'false',

+ '--output', skpdiff_summary_file,

+ '--differs', 'perceptual', 'different_pixels',

+ '--rgbDiffDir', skpdiff_rgbdiff_dir,

+ '--whiteDiffDir', skpdiff_whitediff_dir,

+ ])

+ # Get information out of the skpdiff_summary_file.

+ with contextlib.closing(open(skpdiff_summary_file)) as fp:

+ data = json.load(fp)

+ # For now, we can assume there is only one record in the output summary,

+ # since we passed skpdiff only one pair of images.

+ record = data['records'][0]

+ self._width = record['width']

+ self._height = record['height']

+ # TODO: make max_diff_per_channel a tuple instead of a list, because the

+ # structure is meaningful (first element is red, second is green, etc.)

+ # See http://stackoverflow.com/a/626871

+ self._max_diff_per_channel = [

+ record['maxRedDiff'], record['maxGreenDiff'], record['maxBlueDiff']]

+ rgb_diff_path = record['rgbDiffPath']

+ white_diff_path = record['whiteDiffPath']

+ per_differ_stats = record['diffs']

+ for stats in per_differ_stats:

+ differ_name = stats['differName']

+ if differ_name == 'different_pixels':

+ self._num_pixels_differing = stats['pointsOfInterest']

+ elif differ_name == 'perceptual':

+ perceptual_similarity = stats['result']

+ # skpdiff returns the perceptual similarity; convert it to get the

+ # perceptual difference percentage.

+ # skpdiff outputs -1 if the images are different sizes. Treat any

+ # output that does not lie in [0, 1] as having 0% perceptual

+ # similarity.

+ if not 0 <= perceptual_similarity <= 1:

+ perceptual_similarity = 0

+ self._perceptual_difference = 100 - (perceptual_similarity * 100)

+ # Store the rgbdiff and whitediff images generated above.

+ diff_image_locator = _get_difference_locator(

+ expected_image_locator=expected_image_locator,

+ actual_image_locator=actual_image_locator)

+ basename = str(diff_image_locator) + image_suffix

+ _mkdir_unless_exists(os.path.join(storage_root, RGBDIFFS_SUBDIR))

+ _mkdir_unless_exists(os.path.join(storage_root, WHITEDIFFS_SUBDIR))

+ # TODO: Modify skpdiff's behavior so we can tell it exactly where to

+ # write the image files into, rather than having to move them around

+ # after skpdiff writes them out.

+ shutil.copyfile(rgb_diff_path,

+ os.path.join(storage_root, RGBDIFFS_SUBDIR, basename))

+ shutil.copyfile(white_diff_path,

+ os.path.join(storage_root, WHITEDIFFS_SUBDIR, basename))

finally:

- shutil.rmtree(skpdiff_csv_dir)

- # Final touches on diff_image: use whitediff_image as an alpha mask.

- # Unchanged pixels are transparent; differing pixels are opaque.

- diff_image.putalpha(whitediff_image)

- # Store the diff and whitediff images generated above.

- diff_image_locator = _get_difference_locator(

- expected_image_locator=expected_image_locator,

- actual_image_locator=actual_image_locator)

- basename = str(diff_image_locator) + image_suffix

- _save_image(diff_image, os.path.join(

- storage_root, DIFFS_SUBDIR, basename))

- _save_image(whitediff_image, os.path.join(

- storage_root, WHITEDIFFS_SUBDIR, basename))

- # Calculate difference metrics.

- (self._width, self._height) = diff_image.size

- self._num_pixels_differing = (

- whitediff_image.histogram()[VALUES_PER_BAND - 1])

+ shutil.rmtree(skpdiff_output_dir)

def get_num_pixels_differing(self):

"""Returns the absolute number of pixels that differ."""

@@ -278,102 +281,18 @@ class ImageDiffDB(object):

# Utility functions

-def _max_per_band(histogram):

- """Given the histogram of an image, return the maximum value of each band

- (a.k.a. "color channel", such as R/G/B) across the entire image.

- Args:

- histogram: PIL histogram

- Returns the maximum value of each band within the image histogram, as a list.

- """

- max_per_band = []

- assert(len(histogram) % VALUES_PER_BAND == 0)

- num_bands = len(histogram) / VALUES_PER_BAND

- for band in xrange(num_bands):

- # Assuming that VALUES_PER_BAND is 256...

- # the 'R' band makes up indices 0-255 in the histogram,

- # the 'G' band makes up indices 256-511 in the histogram,

- # etc.

- min_index = band * VALUES_PER_BAND

- index = min_index + VALUES_PER_BAND

- while index > min_index:

- index -= 1

- if histogram[index] > 0:

- max_per_band.append(index - min_index)

- break

- return max_per_band

-def _generate_image_diff(image1, image2):

- """Wrapper for ImageChops.difference(image1, image2) that will handle some

- errors automatically, or at least yield more useful error messages.

- TODO(epoger): Currently, some of the images generated by the bots are RGBA

- and others are RGB. I'm not sure why that is. For now, to avoid confusion

- within the UI, convert all to RGB when diffing.

- Args:

- image1: a PIL image object

- image2: a PIL image object

- Returns: per-pixel diffs between image1 and image2, as a PIL image object

- """

- try:

- return ImageChops.difference(image1.convert('RGB'), image2.convert('RGB'))

- except ValueError:

- logging.error('Error diffing image1 [%s] and image2 [%s].' % (

- repr(image1), repr(image2)))

- raise

-def _download_and_open_image(local_filepath, url):

- """Open the image at local_filepath; if there is no file at that path,

- download it from url to that path and then open it.

+def _download_file(local_filepath, url):

+ """Download a file from url to local_filepath, unless it is already there.

Args:

local_filepath: path on local disk where the image should be stored

url: URL from which we can download the image if we don't have it yet

- Returns: a PIL image object

"""

if not os.path.exists(local_filepath):

_mkdir_unless_exists(os.path.dirname(local_filepath))

with contextlib.closing(urllib.urlopen(url)) as url_handle:

with open(local_filepath, 'wb') as file_handle:

shutil.copyfileobj(fsrc=url_handle, fdst=file_handle)

- return _open_image(local_filepath)

-def _open_image(filepath):

- """Wrapper for Image.open(filepath) that yields more useful error messages.

- Args:

- filepath: path on local disk to load image from

- Returns: a PIL image object

- """

- try:

- return Image.open(filepath)

- except IOError:

- # If we are unable to load an image from the file, delete it from disk

- # and we will try to fetch it again next time. Fixes http://skbug.com/2247

- logging.error('IOError loading image file %s ; deleting it.' % filepath)

- os.remove(filepath)

- raise

-def _save_image(image, filepath, format='PNG'):

- """Write an image to disk, creating any intermediate directories as needed.

- Args:

- image: a PIL image object

- filepath: path on local disk to write image to

- format: one of the PIL image formats, listed at

- http://effbot.org/imagingbook/formats.htm

- """

- _mkdir_unless_exists(os.path.dirname(filepath))

- image.save(filepath, format)

def _mkdir_unless_exists(path):

« no previous file with comments | « no previous file | gm/rebaseline_server/imagepair_test.py » ('j') | no next file with comments »