| Index: tools/android/loading/sandwich_misc.py
|
| diff --git a/tools/android/loading/sandwich_misc.py b/tools/android/loading/sandwich_misc.py
|
| index 13988c3fcf7c59547144188b8285619bb74a19bb..fd0f363a319c722043b6a93b9e42002ea2ecf466 100644
|
| --- a/tools/android/loading/sandwich_misc.py
|
| +++ b/tools/android/loading/sandwich_misc.py
|
| @@ -3,11 +3,14 @@
|
| # found in the LICENSE file.
|
|
|
| import logging
|
| +import json
|
| +import os
|
|
|
| +import chrome_cache
|
| +import common_util
|
| from loading_trace import LoadingTrace
|
| from prefetch_view import PrefetchSimulationView
|
| from request_dependencies_lens import RequestDependencyLens
|
| -from user_satisfied_lens import FirstContentfulPaintLens
|
| import wpr_backend
|
|
|
|
|
| @@ -114,3 +117,127 @@ def ExtractDiscoverableUrls(loading_trace_path, subresource_discoverer):
|
| logging.info('white-listing %s' % request.url)
|
| whitelisted_urls.add(request.url)
|
| return whitelisted_urls
|
| +
|
| +
|
def CompareUrlSet(ref_url_set, url_set, url_set_name, debug_hint='Good luck!'):
  """Compares two URL sets and logs any difference between them.

  Logs a one-line INFO message when the sets match; otherwise logs the
  missing ('-') and unexpected ('+') urls at ERROR level.

  Args:
    ref_url_set: Set of reference urls.
    url_set: Set of urls to compare to the reference.
    url_set_name: The set name for logging purposes.
    debug_hint: A debug hint to help debugging in any case the sets are
      different.
  """
  # isinstance is the idiomatic type check (type(x) == set rejects
  # set subclasses for no reason).
  assert isinstance(ref_url_set, set)
  assert isinstance(url_set, set)
  if ref_url_set == url_set:
    # Lazy %-style arguments: the message is only formatted if INFO is on.
    logging.info(' %d %s are matching.', len(ref_url_set), url_set_name)
    return
  logging.error(' %s are not matching.', url_set_name)
  logging.error(' Hint: %s', debug_hint)
  logging.error(' List of missing resources:')
  for url in ref_url_set.difference(url_set):
    logging.error('- %s', url)
  logging.error(' List of unexpected resources:')
  for url in url_set.difference(ref_url_set):
    logging.error('+ %s', url)
|
| +
|
| +
|
def _ListUrlRequests(trace, from_cache=None):
  """Lists the urls of the http/https requests of a loading trace.

  Args:
    trace: A LoadingTrace instance.
    from_cache: If not None, only keep requests whose from_disk_cache flag
      equals this value; if None, keep all http/https requests.

  Returns:
    Set of request urls.
  """
  urls = set()
  for request_event in trace.request_track.GetEvents():
    # Some requests (e.g. data URIs) have no protocol; `is None` is the
    # correct identity test (PEP 8), not `== None`.
    if request_event.protocol is None:
      continue
    if not request_event.protocol.startswith('http'):
      continue
    if from_cache is not None and request_event.from_disk_cache != from_cache:
      continue
    urls.add(request_event.url)
  return urls
|
| +
|
| +
|
def VerifyBenchmarkOutputDirectory(benchmark_setup_path,
                                   benchmark_output_directory_path):
  """Verifies that all runs inside the run_output_directory worked as expected.

  For each run directory (named 0, 1, 2, ... until the first missing one),
  loads its trace and compares the traced requests against the resources and
  cache whitelist recorded in the benchmark setup.

  Args:
    benchmark_setup_path: Path of the JSON of the benchmark setup.
    benchmark_output_directory_path: Path of the benchmark output directory to
      verify.
  """
  # `with` ensures the setup file is closed deterministically
  # (json.load(open(...)) leaks the handle until GC).
  with open(benchmark_setup_path) as setup_file:
    benchmark_setup = json.load(setup_file)
  cache_whitelist = set(benchmark_setup['cache_whitelist'])
  url_resources = set(benchmark_setup['url_resources'])

  # Verify requests from traces.
  run_id = 0
  while True:
    run_path = os.path.join(benchmark_output_directory_path, str(run_id))
    run_id += 1
    if not os.path.isdir(run_path):
      break
    trace_path = os.path.join(run_path, 'trace.json')
    if not os.path.isfile(trace_path):
      # A missing trace means the run crashed; report it but keep verifying
      # the remaining runs.
      logging.error('missing trace %s', trace_path)
      continue
    trace = LoadingTrace.FromJsonFile(trace_path)
    logging.info('verifying %s from %s', trace.url, trace_path)
    CompareUrlSet(url_resources, _ListUrlRequests(trace), 'All resources',
                  'You may have an issue with an AJAX requests.')
    CompareUrlSet(url_resources.intersection(cache_whitelist),
                  _ListUrlRequests(trace, True), 'Cached resources',
                  'The WPR archive patcher may have an invalidation issue.')
    CompareUrlSet(url_resources.difference(cache_whitelist),
                  _ListUrlRequests(trace, False), 'Non cached resources')
|
| +
|
| +
|
def ListResourcesUrls(benchmark_output_directory_path):
  """Lists all requested urls per navigated url.

  Walks the run directories (named 0, 1, 2, ... until the first missing one)
  and, for the first trace seen per navigated url, collects the urls of its
  http/https sub-resource requests.

  Args:
    benchmark_output_directory_path: Path of the benchmark output directory to
      verify.

  Returns:
    {url -> [urls of sub-resources]}
  """
  url_subresources = {}
  run_id = 0
  while True:
    run_path = os.path.join(benchmark_output_directory_path, str(run_id))
    run_id += 1
    if not os.path.isdir(run_path):
      break
    trace_path = os.path.join(run_path, 'trace.json')
    if not os.path.isfile(trace_path):
      continue
    trace = LoadingTrace.FromJsonFile(trace_path)
    # Only inspect the first trace per navigated url.
    if trace.url in url_subresources:
      continue
    logging.info('lists resources of %s from %s', trace.url, trace_path)
    urls_set = set()
    for request_event in trace.request_track.GetEvents():
      # Guard against protocol-less requests (e.g. data URIs), consistently
      # with _ListUrlRequests; calling startswith on None would raise.
      if request_event.protocol is None:
        continue
      if not request_event.protocol.startswith('http'):
        continue
      if request_event.url not in urls_set:
        logging.info(' %s', request_event.url)
        urls_set.add(request_event.url)
    url_subresources[trace.url] = list(urls_set)
  return url_subresources
|
| +
|
| +
|
def ValidateCacheArchiveContent(ref_urls, cache_archive_path):
  """Validates a cache archive content.

  Unzips the cache archive into a temporary directory, lists the keys of the
  'simple' cache backend found there, and compares them against the reference
  urls.

  Args:
    ref_urls: Reference list of urls.
    cache_archive_path: Cache archive's path to validate.
  """
  logging.info('lists cached urls from %s' % cache_archive_path)
  with common_util.TemporaryDirectory() as cache_directory:
    chrome_cache.UnzipDirectoryContent(cache_archive_path, cache_directory)
    cache_backend = chrome_cache.CacheBackend(cache_directory, 'simple')
    cached_urls = cache_backend.ListKeys()
    CompareUrlSet(set(ref_urls), set(cached_urls), 'cached resources',
                  debug_hint='Looks like a response header needs to be patched.')
|
|
|