Chromium Code Reviews| Index: tools/skpdiff/skpdiff_server.py |
| diff --git a/tools/skpdiff/skpdiff_server.py b/tools/skpdiff/skpdiff_server.py |
| index 79ffc839e25064e97d3c117f1879b999b9ffcae5..c3594f082bad60c1521efa1bbe5079f07fffd52a 100755 |
| --- a/tools/skpdiff/skpdiff_server.py |
| +++ b/tools/skpdiff/skpdiff_server.py |
| @@ -8,6 +8,7 @@ import json |
| import os |
| import os.path |
| import re |
| +import subprocess |
| import sys |
| import tempfile |
| import urllib2 |
| @@ -99,7 +100,7 @@ def download_gm_image(image_name, image_path, hash_val): |
| @param hash_val The hash value of the image. |
| """ |
| - # Seperate the test name from a image name |
| + # Separate the test name from a image name |
| image_match = IMAGE_FILENAME_RE.match(image_name) |
| test_name = image_match.group(1) |
| @@ -111,71 +112,6 @@ def download_gm_image(image_name, image_path, hash_val): |
| download_file(image_url, image_path) |
| -def download_changed_images(expectations_dir, expected_name, updated_name, |
| - expected_image_dir, actual_image_dir): |
| - |
| - """Download the expected and actual GMs that changed into the given paths. |
| - Determining what changed will be done by comparing each expected_name JSON |
| - results file to its corresponding updated_name JSON results file if it |
| - exists. |
| - |
| - @param expectations_dir The directory to traverse for results files. This |
| - should resmble expectations/gm in the Skia trunk. |
| - @param expected_name The name of the expected result files. These are |
| - in the format of expected-results.json. |
| - @param updated_name The name of the updated expected result files. |
| - Normally this matches --expectations-filename-output for the |
| - rebaseline.py tool. |
| - @param expected_image_dir The directory to place downloaded expected images |
| - into. |
| - @param actual_image_dir The directory to place downloaded actual images |
| - into. |
| - """ |
| - |
| - differ = jsondiff.GMDiffer() |
| - |
| - # Look through expectations for hashes that changed |
| - for root, dirs, files in os.walk(expectations_dir): |
| - for expectation_file in files: |
| - # There are many files in the expectations directory. We only care |
| - # about expected results. |
| - if expectation_file != expected_name: |
| - continue |
| - |
| - # Get the name of the results file, and be sure there is an updated |
| - # result to compare against. If there is not, there is no point in |
| - # diffing this device. |
| - expected_file_path = os.path.join(root, expected_name) |
| - updated_file_path = os.path.join(root, updated_name) |
| - if not os.path.isfile(updated_file_path): |
| - continue |
| - |
| - # Find all expectations that did not match. |
| - expected_diff = differ.GenerateDiffDict(expected_file_path, |
| - updated_file_path) |
| - |
| - # The name of the device corresponds to the name of the folder we |
| - # are in. |
| - device_name = os.path.basename(root) |
| - |
| - # Create name prefixes to store the devices old and new GM results |
| - expected_image_prefix = os.path.join(expected_image_dir, |
| - device_name) + '-' |
| - |
| - actual_image_prefix = os.path.join(actual_image_dir, |
| - device_name) + '-' |
| - |
| - # Download each image that had a differing result |
| - for image_name, hashes in expected_diff.iteritems(): |
| - print('Downloading', image_name, 'for device', device_name) |
| - download_gm_image(image_name, |
| - expected_image_prefix + image_name, |
| - hashes['old']) |
| - download_gm_image(image_name, |
| - actual_image_prefix + image_name, |
| - hashes['new']) |
| - |
| - |
| def get_image_set_from_skpdiff(skpdiff_records): |
| """Get the set of all images references in the given records. |
| @@ -186,6 +122,204 @@ def get_image_set_from_skpdiff(skpdiff_records): |
| return expected_set | actual_set |
| +def set_expected_hash_in_json(expected_results_json, image_name, hash_value): |
| + """Set the expected hash for the object extracted from |
| + expected-results.json. |
| + |
| + @param expected_results_json The Python dictionary with the results to |
| + modify. |
| + @param image_name The name of the image to set the hash of. |
| + @param hash_value The hash to set for the image. |
| + """ |
| + expected_results = expected_results_json[gm_json.JSONKEY_EXPECTEDRESULTS] |
| + |
| + if image_name in expected_results: |
| + expected_results[image_name][gm_json.JSONKEY_EXPECTEDRESULTS_ALLOWEDDIGESTS][0][1] = hash_value |
|
Zach Reizner
2013/08/01 22:24:40
Curse you 80 character line length.
epoger
2013/08/02 14:33:06
Indeed.
If you want to, you can split it like so
Zach Reizner
2013/08/02 21:30:58
I do not want to.
epoger
2013/08/06 15:26:43
Fine, be that way.
|
| + else: |
| + expected_results[image_name] = { |
| + gm_json.JSONKEY_EXPECTEDRESULTS_ALLOWEDDIGESTS: |
| + [ |
| + [ |
| + 'bitmap-64bitMD5', |
|
epoger
2013/08/02 14:33:06
please use the constant reference to this string v
Zach Reizner
2013/08/02 21:30:58
Done.
|
| + hash_value |
| + ] |
| + ] |
| + } |
| + |
| + |
| +def get_git_version(path): |
|
epoger
2013/08/02 14:33:06
IMHO, get_head_version or get_base_version would b
Zach Reizner
2013/08/02 21:30:58
Done.
|
| + """Get the version of the file at the given path stored inside the HEAD of |
| + the git repository. It is returned as a string. |
| + |
| + @param path The path of the file whose HEAD is returned. It is assumed the |
| + path is inside a git repo rooted at SKIA_ROOT_DIR. |
| + """ |
| + |
| + # git-show will only work with paths relative to the root of the git repo. |
|
epoger
2013/08/02 14:33:06
This is great, but FYI, git-show works with a path
Zach Reizner
2013/08/02 21:30:58
Thanks
|
| + # This ensures we give it that relative path. |
| + git_path = os.path.relpath(path, SKIA_ROOT_DIR) |
| + git_show_proc = subprocess.Popen(['git', 'show', 'HEAD:' + git_path], |
| + stdout=subprocess.PIPE) |
| + |
| + # When invoked outside a shell, git will output the last committed version |
| + # of the file directly to stdout. |
| + git_version_content, _ = git_show_proc.communicate() |
| + return git_version_content |
| + |
| + |
| +class ExpectationsManager: |
| + def __init__(self, expectations_dir, expected_name, updated_name, |
| + skpdiff_path): |
| + """ |
| + @param expectations_dir The directory to traverse for results files. |
| + This should resmble expectations/gm in the Skia trunk. |
| + @param expected_name The name of the expected result files. These |
| + are in the format of expected-results.json. |
| + @param updated_name The name of the updated expected result files. |
| + Normally this matches --expectations-filename-output for the |
|
epoger
2013/08/02 14:33:06
I don't understand why we need the updated expecte
Zach Reizner
2013/08/02 21:30:58
You make an excellent point.
Derek and I have bee
|
| + rebaseline.py tool. |
| + @param skpdiff_path The path used to execute the skpdiff command. |
| + """ |
| + self.expectations_dir = expectations_dir |
|
epoger
2013/08/02 14:33:06
Typically, we would use underscored (self._expecta
Zach Reizner
2013/08/02 21:30:58
Done.
|
| + self.expected_name = expected_name |
| + self.updated_name = updated_name |
| + self.skpdiff_path = skpdiff_path |
| + self.generate_gm_comparison() |
| + |
| + def generate_gm_comparison(self): |
| + """Generate all the data needed to compare GMs including downloading the |
| + changed images and comparing them skpdiff. |
|
epoger
2013/08/02 14:33:06
I think it would be clearer in bullet list form:
Zach Reizner
2013/08/02 21:30:58
Done.
|
| + """ |
| + # Create a temporary file tree that makes sense for skpdiff to operate |
| + # on. |
| + image_output_dir = tempfile.mkdtemp('skpdiff') |
| + expected_image_dir = os.path.join(image_output_dir, 'expected') |
| + actual_image_dir = os.path.join(image_output_dir, 'actual') |
| + os.mkdir(expected_image_dir) |
| + os.mkdir(actual_image_dir) |
| + |
| + # Download expected and actual images that differed into the temporary |
| + # file tree. |
| + self.download_changed_images(expected_image_dir, actual_image_dir) |
| + |
| + # Invoke skpdiff with our downloaded images and place its results in the |
| + # temporary directory. |
| + self.skpdiff_output_path = os.path.join(image_output_dir, |
| + 'skpdiff_output.json') |
| + skpdiff_cmd = SKPDIFF_INVOKE_FORMAT.format(self.skpdiff_path, |
| + self.skpdiff_output_path, |
| + expected_image_dir, |
| + actual_image_dir) |
| + os.system(skpdiff_cmd) |
| + |
| + def download_changed_images(self, expected_image_dir, actual_image_dir): |
|
epoger
2013/08/02 14:33:06
Ultimately, it would be good for us to have self-t
|
| + """Download the expected and actual GMs that changed into the given |
| + paths. Determining what changed will be done by comparing each |
| + expected_name JSON results file to its corresponding updated_name JSON |
| + results file if it exists. |
| + |
| + @param expected_image_dir The directory to place downloaded expected |
|
epoger
2013/08/02 14:33:06
maybe clearer to call this "The directory to downl
Zach Reizner
2013/08/02 21:30:58
Done.
|
| + into. |
| + @param actual_image_dir The directory to place downloaded actual |
| + images into. |
| + """ |
| + image_map = {} |
| + differ = jsondiff.GMDiffer() |
| + |
| + # Look through expectations for hashes that changed |
| + for root, dirs, files in os.walk(self.expectations_dir): |
| + for expectation_file in files: |
| + # There are many files in the expectations directory. We only |
| + # care about expected results. |
| + if expectation_file != self.expected_name: |
| + continue |
| + |
| + # Get the name of the results file, and be sure there is an |
| + # updated result to compare against. If there is not, there is |
| + # no point in diffing this device. |
| + expected_file_path = os.path.join(root, self.expected_name) |
| + updated_file_path = os.path.join(root, self.updated_name) |
| + if not os.path.isfile(updated_file_path): |
| + continue |
| + |
| + # Always get the expected results from git because we may have |
| + # changed them in a previous instance of the server. |
| + expected_contents = get_git_version(expected_file_path) |
| + updated_contents = None |
| + with open(updated_file_path, 'rb') as updated_file: |
| + updated_contents = updated_file.read() |
| + |
| + # Find all expectations that did not match. |
| + expected_diff = differ.GenerateDiffDictFromStrings( |
| + expected_contents, |
| + updated_contents) |
| + |
| + # The name of the device corresponds to the name of the folder |
| + # we are in. |
| + device_name = os.path.basename(root) |
| + |
| + # Creat name prefixes to store the device's old and new GM |
| + # results. |
| + expected_image_prefix = os.path.join(expected_image_dir, |
| + device_name) + '-' |
| + |
| + actual_image_prefix = os.path.join(actual_image_dir, |
| + device_name) + '-' |
| + |
| + # Download each image that had a differing result. We take care |
| + # to store metadata about each image so that we know about an |
| + # image from its path on disk alone. That is all we will know |
| + # after skpdiff outputs its results. |
| + for image_name, hashes in expected_diff.iteritems(): |
| + print('Downloading', image_name, 'for device', device_name) |
| + download_gm_image(image_name, |
| + expected_image_prefix + image_name, |
| + hashes['old']) |
| + image_map[expected_image_prefix + image_name] = ( |
| + device_name, image_name, hashes['old']) |
| + download_gm_image(image_name, |
| + actual_image_prefix + image_name, |
| + hashes['new']) |
| + image_map[actual_image_prefix + image_name] = ( |
| + device_name, image_name, hashes['new']) |
| + |
| + self.image_map = image_map |
| + |
| + def set_expected_hash(self, device_name, image_name, hash_value): |
| + """Set the expected hash for the image of the given device. This always |
| + writes directly to the expected results file of the given device |
| + |
| + @param device_name The name of the device to write the hash to. |
| + @param image_name The name of the image whose hash to set. |
| + @param hash_value The value of the hash to set. |
| + """ |
| + |
| + # Retrieve the expected results file as it is in the working tree |
| + json_path = os.path.join(self.expectations_dir, device_name, |
| + self.expected_name) |
| + expectations = gm_json.LoadFromFile(json_path) |
| + |
| + # Set the specified hash. |
| + set_expected_hash_in_json(expectations, image_name, hash_value) |
| + |
| + # Write it out to disk using gm_json to keep the formatting consistent. |
| + gm_json.WriteToFile(expectations, json_path) |
| + |
| + def use_hash_of(self, image_path): |
| + """Determine the hash of the image at the path using the records, and |
| + set it as the expected hash for its device and image config. |
| + |
| + @param image_path The path of the image as it was stored in the output |
| + of skpdiff_path |
| + """ |
| + |
| + # Get the metadata about the image at the path. |
| + device_name, image_name, hash_value = self.image_map[image_path] |
| + |
| + # Write out that image's hash directly to the expected results file. |
| + self.set_expected_hash(device_name, image_name, hash_value) |
| + |
| + |
| class SkPDiffHandler(BaseHTTPServer.BaseHTTPRequestHandler): |
| def send_file(self, file_path): |
| # Grab the extension if there is one |
| @@ -211,7 +345,6 @@ class SkPDiffHandler(BaseHTTPServer.BaseHTTPRequestHandler): |
| # under the dir_path. This is to prevent accidentally serving files |
| # outside the directory intended using symlinks, or '../'. |
| real_path = os.path.normpath(os.path.join(dir_path, file_path)) |
| - print(repr(real_path)) |
| if os.path.commonprefix([real_path, dir_path]) == dir_path: |
| if os.path.isfile(real_path): |
| self.send_file(real_path) |
| @@ -248,12 +381,26 @@ class SkPDiffHandler(BaseHTTPServer.BaseHTTPRequestHandler): |
| # If no file to send was found, just give the standard 404 |
| self.send_error(404) |
| + def do_POST(self): |
| + if self.path == '/set_hash': |
| + content_length = int(self.headers['Content-length']) |
| + request_data = json.loads(self.rfile.read(content_length)) |
| + self.server.expectations_manager.use_hash_of(request_data['path']) |
| + self.send_response(200) |
| + self.send_header('Content-type', 'application/json') |
| + self.end_headers() |
| + self.wfile.write('{"success":true}') |
| + return |
| + |
| + # If the we have no handler for this path, give em' the 404 |
| + self.send_error(404) |
| -def run_server(skpdiff_output_path, port=8080): |
| + |
| +def run_server(expectations_manager, port=8080): |
| # Preload the skpdiff results file. This is so we can perform some |
| # processing on it. |
| skpdiff_output_json = '' |
| - with open(skpdiff_output_path, 'rb') as records_file: |
| + with open(expectations_manager.skpdiff_output_path, 'rb') as records_file: |
| skpdiff_output_json = records_file.read() |
| # It's important to parse the results file so that we can make a set of |
| @@ -261,10 +408,14 @@ def run_server(skpdiff_output_path, port=8080): |
| skpdiff_records = json.loads(skpdiff_output_json)['records'] |
| image_set = get_image_set_from_skpdiff(skpdiff_records) |
| + for record in skpdiff_records: |
| + record['device'] = os.path.basename(record['baselinePath']) |
| + |
| # Add JSONP padding to the JSON because the web page expects it. It expects |
| # it because it was designed to run with or without a web server. Without a |
| # web server, the only way to load JSON is with JSONP. |
| - skpdiff_output_json = 'var SkPDiffRecords = ' + skpdiff_output_json |
| + skpdiff_output_json = ('var SkPDiffRecords = ' + |
| + json.dumps({'records': skpdiff_records}) + ';') |
| # Do not bind to interfaces other than localhost because the server will |
| # attempt to serve files relative to the root directory as a last resort |
| @@ -274,7 +425,8 @@ def run_server(skpdiff_output_path, port=8080): |
| http_server = BaseHTTPServer.HTTPServer(server_address, SkPDiffHandler) |
| http_server.image_set = image_set |
| http_server.skpdiff_output_json = skpdiff_output_json |
| - print('Navigate thine browser to: http://{}:{}'.format(*server_address)) |
| + http_server.expectations_manager = expectations_manager |
| + print('Navigate thine browser to: http://{}:{}/'.format(*server_address)) |
| http_server.serve_forever() |
| @@ -320,39 +472,19 @@ def main(): |
| if skpdiff_path is None: |
| sys.exit(1) |
| - # Create a temporary file tree that makes sense for skpdiff.to operate on |
| - image_output_dir = tempfile.mkdtemp('skpdiff') |
| - expected_image_dir = os.path.join(image_output_dir, 'expected') |
| - actual_image_dir = os.path.join(image_output_dir, 'actual') |
| - os.mkdir(expected_image_dir) |
| - os.mkdir(actual_image_dir) |
| - |
| # Print out the paths of things for easier debugging |
| print('script dir :', SCRIPT_DIR) |
| print('tools dir :', TOOLS_DIR) |
| print('root dir :', SKIA_ROOT_DIR) |
| print('expectations dir :', args['expectations_dir']) |
| print('skpdiff path :', skpdiff_path) |
| - print('tmp dir :', image_output_dir) |
| - print('expected image dir :', expected_image_dir) |
| - print('actual image dir :', actual_image_dir) |
| - |
| - # Download expected and actual images that differed into the temporary file |
| - # tree. |
| - download_changed_images(args['expectations_dir'], |
| - args['expected'], args['updated'], |
| - expected_image_dir, actual_image_dir) |
| - |
| - # Invoke skpdiff with our downloaded images and place its results in the |
| - # temporary directory. |
| - skpdiff_output_path = os.path.join(image_output_dir, 'skpdiff_output.json') |
| - skpdiff_cmd = SKPDIFF_INVOKE_FORMAT.format(skpdiff_path, |
| - skpdiff_output_path, |
| - expected_image_dir, |
| - actual_image_dir) |
| - os.system(skpdiff_cmd) |
| - |
| - run_server(skpdiff_output_path, port=args['port']) |
| + |
| + expectations_manager = ExpectationsManager(args['expectations_dir'], |
| + args['expected'], |
| + args['updated'], |
| + skpdiff_path) |
| + |
| + run_server(expectations_manager, port=args['port']) |
| if __name__ == '__main__': |
| main() |