gm/rebaseline_server/imagediffdb.py - Issue 325413003: rebaseline_server: use just skpdiff, not Python Image Library

Unified Diff: gm/rebaseline_server/imagediffdb.py

Issue 325413003: rebaseline_server: use just skpdiff, not Python Image Library (Closed) Base URL: https://skia.googlesource.com/skia.git@master

Patch Set: Created 6 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: gm/rebaseline_server/imagediffdb.py

diff --git a/gm/rebaseline_server/imagediffdb.py b/gm/rebaseline_server/imagediffdb.py

index 6b684143b03f256a6a4eee87d43447eabfe713f8..c7b9a75e2b8326f00cac7760f1879ada77e823e5 100644

--- a/gm/rebaseline_server/imagediffdb.py

+++ b/gm/rebaseline_server/imagediffdb.py

@@ -10,7 +10,7 @@ Calulate differences between image pairs, and store them in a database.

"""

import contextlib

-import csv

+import json

import logging

import os

import re

@@ -18,11 +18,6 @@ import shutil

import sys

import tempfile

import urllib

-try:

- from PIL import Image, ImageChops

-except ImportError:

- raise ImportError('Requires PIL to be installed; see '

- + 'http://www.pythonware.com/products/pil/')

# Set the PYTHONPATH to include the tools directory.

sys.path.append(

@@ -38,11 +33,9 @@ DEFAULT_IMAGES_SUBDIR = 'images'

DISALLOWED_FILEPATH_CHAR_REGEX = re.compile('[^\w\-]')

-DIFFS_SUBDIR = 'diffs'

+RGBDIFFS_SUBDIR = 'diffs'

WHITEDIFFS_SUBDIR = 'whitediffs'

-VALUES_PER_BAND = 256

# Keys used within DiffRecord dictionary representations.

# NOTE: Keep these in sync with static/constants.js

KEY__DIFFERENCES__MAX_DIFF_PER_CHANNEL = 'maxDiffPerChannel'

@@ -87,9 +80,8 @@ class DiffRecord(object):

actual_image_locator = _sanitize_locator(actual_image_locator)

# Download the expected/actual images, if we don't have them already.

- # TODO(rmistry): Add a parameter that makes _download_and_open_image raise

- # an exception if images are not found locally (instead of trying to

- # download them).

+ # TODO(rmistry): Add a parameter that just tries to use already-present

+ # image files rather than downloading them.

expected_image_file = os.path.join(

storage_root, expected_images_subdir,

str(expected_image_locator) + image_suffix)

@@ -97,81 +89,91 @@ class DiffRecord(object):

storage_root, actual_images_subdir,

str(actual_image_locator) + image_suffix)

try:

- expected_image = _download_and_open_image(

- expected_image_file, expected_image_url)

+ expected_image = _download_file(expected_image_file, expected_image_url)

except Exception:

logging.exception('unable to download expected_image_url %s to file %s' %

(expected_image_url, expected_image_file))

raise

try:

- actual_image = _download_and_open_image(

- actual_image_file, actual_image_url)

+ actual_image = _download_file(actual_image_file, actual_image_url)

except Exception:

logging.exception('unable to download actual_image_url %s to file %s' %

(actual_image_url, actual_image_file))

raise

- # Generate the diff image (absolute diff at each pixel) and

- # max_diff_per_channel.

- diff_image = _generate_image_diff(actual_image, expected_image)

- diff_histogram = diff_image.histogram()

- (diff_width, diff_height) = diff_image.size

- self._max_diff_per_channel = _max_per_band(diff_histogram)

- # Generate the whitediff image (any differing pixels show as white).

- # This is tricky, because when you convert color images to grayscale or

- # black & white in PIL, it has its own ideas about thresholds.

- # We have to force it: if a pixel has any color at all, it's a '1'.

- bands = diff_image.split()

- graydiff_image = ImageChops.lighter(ImageChops.lighter(

- bands[0], bands[1]), bands[2])

- whitediff_image = (graydiff_image.point(lambda p: p > 0 and VALUES_PER_BAND)

- .convert('1', dither=Image.NONE))

- # Calculate the perceptual difference percentage.

- skpdiff_csv_dir = tempfile.mkdtemp()

+ # EPOGER: check for 80 columns throughout

epoger 2014/06/12 07:02:07 These EPOGERs indicate changes that I *know* I wan

+ # Get all diff images and values from skpdiff binary.

+ skpdiff_output_dir = tempfile.mkdtemp()

try:

- skpdiff_csv_output = os.path.join(skpdiff_csv_dir, 'skpdiff-output.csv')

+ skpdiff_summary_file = os.path.join(skpdiff_output_dir,

+ 'skpdiff-output.json')

+ skpdiff_rgbdiff_dir = os.path.join(skpdiff_output_dir, 'rgbDiff')

+ skpdiff_whitediff_dir = os.path.join(skpdiff_output_dir, 'whiteDiff')

expected_img = os.path.join(storage_root, expected_images_subdir,

str(expected_image_locator) + image_suffix)

actual_img = os.path.join(storage_root, actual_images_subdir,

str(actual_image_locator) + image_suffix)

+ # TODO: Call skpdiff ONCE for all image pairs, instead of calling it

+ # repeatedly.

find_run_binary.run_command(

[SKPDIFF_BINARY, '-p', expected_img, actual_img,

- '--csv', skpdiff_csv_output, '-d', 'perceptual'])

- with contextlib.closing(open(skpdiff_csv_output)) as csv_file:

- for row in csv.DictReader(csv_file):

- perceptual_similarity = float(row[' perceptual'].strip())

- if not 0 <= perceptual_similarity <= 1:

- # skpdiff outputs -1 if the images are different sizes. Treat any

- # output that does not lie in [0, 1] as having 0% perceptual

- # similarity.

- perceptual_similarity = 0

- # skpdiff returns the perceptual similarity, convert it to get the

- # perceptual difference percentage.

- self._perceptual_difference = 100 - (perceptual_similarity * 100)

+ '--jsonp', 'false',

+ '--output', skpdiff_summary_file,

+ '--differs', 'perceptual', 'different_pixels',

epoger 2014/06/12 07:02:07 This is one cause of the slowdown... we just to te

djsollen 2014/06/12 13:27:00 If you're not specifying the number of threads it

epoger 2014/06/12 14:02:34 Good explanation, thanks. I definitely want to ex

+ '--rgbDiffDir', skpdiff_rgbdiff_dir,

+ '--whiteDiffDir', skpdiff_whitediff_dir,

+ ])

+ # Get information out of the skpdiff_summary_file.

+ with contextlib.closing(open(skpdiff_summary_file)) as fp:

+ data = json.load(fp)

+ # For now, we can assume there is only one record in the output summary,

+ # since we passed skpdiff only one pair of images.

+ record = data['records'][0]

+ self._width = record['width']

+ self._height = record['height']

+ self._max_diff_per_channel = [

+ record['maxRedDiff'], record['maxGreenDiff'], record['maxBlueDiff']]

+ per_differ_stats = record['diffs']

+ for stats in per_differ_stats:

+ differ_name = stats['differName']

+ if differ_name == 'different_pixels':

+ self._num_pixels_differing = stats['pointsOfInterest']

+ elif differ_name == 'perceptual':

+ perceptual_similarity = stats['result']

+ # skpdiff returns the perceptual similarity; convert it to get the

+ # perceptual difference percentage.

+ # skpdiff outputs -1 if the images are different sizes. Treat any

+ # output that does not lie in [0, 1] as having 0% perceptual

+ # similarity.

+ if not 0 <= perceptual_similarity <= 1:

+ perceptual_similarity = 0

+ self._perceptual_difference = 100 - (perceptual_similarity * 100)

+ # Store the rgbdiff and whitediff images generated above.

+ diff_image_locator = _get_difference_locator(

+ expected_image_locator=expected_image_locator,

+ actual_image_locator=actual_image_locator)

+ basename = str(diff_image_locator) + image_suffix

+ _mkdir_unless_exists(os.path.join(storage_root, RGBDIFFS_SUBDIR))

+ _mkdir_unless_exists(os.path.join(storage_root, WHITEDIFFS_SUBDIR))

+ # TODO: we could just os.rename() the file, if we knew that

+ # skpdiff_whitediff_dir was on the same filesystem. But it's not.

+ #

+ # EPOGER: instead of _find_single_file_in_dir(), we can now use

epoger 2014/06/12 07:02:07 If we could make skpdiff write its output directly

djsollen 2014/06/12 13:26:59 That shouldn't be too hard.

epoger 2014/06/12 14:02:34 The main problem is that right now you can tell sk

+ # rgbDiffPath and whiteDiffPath within the skpdiff summary

+ shutil.copyfile(_find_single_file_in_dir(skpdiff_rgbdiff_dir),

+ os.path.join(storage_root, RGBDIFFS_SUBDIR, basename))

+ shutil.copyfile(_find_single_file_in_dir(skpdiff_whitediff_dir),

+ os.path.join(storage_root, WHITEDIFFS_SUBDIR, basename))

finally:

- shutil.rmtree(skpdiff_csv_dir)

- # Final touches on diff_image: use whitediff_image as an alpha mask.

- # Unchanged pixels are transparent; differing pixels are opaque.

- diff_image.putalpha(whitediff_image)

- # Store the diff and whitediff images generated above.

- diff_image_locator = _get_difference_locator(

- expected_image_locator=expected_image_locator,

- actual_image_locator=actual_image_locator)

- basename = str(diff_image_locator) + image_suffix

- _save_image(diff_image, os.path.join(

- storage_root, DIFFS_SUBDIR, basename))

- _save_image(whitediff_image, os.path.join(

- storage_root, WHITEDIFFS_SUBDIR, basename))

- # Calculate difference metrics.

- (self._width, self._height) = diff_image.size

- self._num_pixels_differing = (

- whitediff_image.histogram()[VALUES_PER_BAND - 1])

+ shutil.rmtree(skpdiff_output_dir)

epoger 2014/06/12 07:02:07 All of these writing files and then deleting direc

+ # EPOGER: how many of these methods are no longer used?

def get_num_pixels_differing(self):

"""Returns the absolute number of pixels that differ."""

return self._num_pixels_differing

@@ -305,75 +307,34 @@ def _max_per_band(histogram):

return max_per_band

-def _generate_image_diff(image1, image2):

- """Wrapper for ImageChops.difference(image1, image2) that will handle some

- errors automatically, or at least yield more useful error messages.

- TODO(epoger): Currently, some of the images generated by the bots are RGBA

- and others are RGB. I'm not sure why that is. For now, to avoid confusion

- within the UI, convert all to RGB when diffing.

- Args:

- image1: a PIL image object

- image2: a PIL image object

- Returns: per-pixel diffs between image1 and image2, as a PIL image object

- """

- try:

- return ImageChops.difference(image1.convert('RGB'), image2.convert('RGB'))

- except ValueError:

- logging.error('Error diffing image1 [%s] and image2 [%s].' % (

- repr(image1), repr(image2)))

- raise

-def _download_and_open_image(local_filepath, url):

- """Open the image at local_filepath; if there is no file at that path,

- download it from url to that path and then open it.

+def _download_file(local_filepath, url):

+ """Download a file from url to local_filepath, unless it is already there.

Args:

local_filepath: path on local disk where the image should be stored

url: URL from which we can download the image if we don't have it yet

- Returns: a PIL image object

"""

if not os.path.exists(local_filepath):

_mkdir_unless_exists(os.path.dirname(local_filepath))

with contextlib.closing(urllib.urlopen(url)) as url_handle:

with open(local_filepath, 'wb') as file_handle:

shutil.copyfileobj(fsrc=url_handle, fdst=file_handle)

- return _open_image(local_filepath)

-def _open_image(filepath):

- """Wrapper for Image.open(filepath) that yields more useful error messages.

- Args:

- filepath: path on local disk to load image from

- Returns: a PIL image object

- """

- try:

- return Image.open(filepath)

- except IOError:

- # If we are unable to load an image from the file, delete it from disk

- # and we will try to fetch it again next time. Fixes http://skbug.com/2247

- logging.error('IOError loading image file %s ; deleting it.' % filepath)

- os.remove(filepath)

- raise

+def _find_single_file_in_dir(dirpath):

+ """Returns the full path of the lone file within this directory.

-def _save_image(image, filepath, format='PNG'):

- """Write an image to disk, creating any intermediate directories as needed.

+ If the directory does not exist, contains no files, or contains multiple

+ files, this will raise an exception.

Args:

- image: a PIL image object

- filepath: path on local disk to write image to

- format: one of the PIL image formats, listed at

- http://effbot.org/imagingbook/formats.htm

+ dirpath: path to a directory on local disk

"""

- _mkdir_unless_exists(os.path.dirname(filepath))

- image.save(filepath, format)

+ filenames = os.listdir(dirpath)

+ if len(filenames) != 1:

+ raise Exception('dir %s does not contain exactly one file: %s' % (

+ dirpath, filenames))

+ return os.path.join(dirpath, filenames[0])

def _mkdir_unless_exists(path):

« no previous file with comments | « no previous file | gm/rebaseline_server/imagepair_test.py » ('j') | gm/rebaseline_server/imagepair_test.py » ('J')