telemetry/telemetry/wpr/archive_info2.py - Issue 2626373004: [WPR] Implement platform dependent recordings for WPR archives.

Unified Diff: telemetry/telemetry/wpr/archive_info2.py

Issue 2626373004: [WPR] Implement platform dependent recordings for WPR archives. (Closed)

Patch Set: Rebase (created 3 years, 11 months ago)

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: telemetry/telemetry/wpr/archive_info2.py

diff --git a/telemetry/telemetry/wpr/archive_info.py b/telemetry/telemetry/wpr/archive_info2.py

similarity index 66%

copy from telemetry/telemetry/wpr/archive_info.py

copy to telemetry/telemetry/wpr/archive_info2.py

index 326da2d36b7411bcd7a7db5aa1212dc1f4991ab2..d8c3f95dbc000639f76b73265a7c9f4164aa0ea5 100644

--- a/telemetry/telemetry/wpr/archive_info.py

+++ b/telemetry/telemetry/wpr/archive_info2.py

@@ -12,6 +12,14 @@ import tempfile

from py_utils import cloud_storage # pylint: disable=import-error

+_DEFAULT_PLATFORM = 'DEFAULT'

+_ALL_PLATFORMS = ['mac', 'linux', 'android', 'win', _DEFAULT_PLATFORM]

+# TODO(rnephew): Move this file to archive_info.py when it is the default.

+# These changes were deliberately not merged into archive_info.py directly

+# because all code in archive_info.py will be deleted once everything is

+# switched to using this version.

def AssertValidCloudStorageBucket(bucket):

is_valid = bucket in (None,

cloud_storage.PUBLIC_BUCKET,

@@ -21,10 +29,6 @@ def AssertValidCloudStorageBucket(bucket):

raise ValueError("Cloud storage privacy bucket %s is invalid" % bucket)

-class ArchiveError(Exception):

- pass

class WprArchiveInfo(object):

def __init__(self, file_path, data, bucket):

AssertValidCloudStorageBucket(bucket)

@@ -32,34 +36,29 @@ class WprArchiveInfo(object):

self._base_dir = os.path.dirname(file_path)

self._data = data

self._bucket = bucket

+ self.temp_target_wpr_file_path = None

# Ensure directory exists.

if not os.path.exists(self._base_dir):

os.makedirs(self._base_dir)

- # Map from the relative path (as it appears in the metadata file) of the

- # .wpr file to a list of story names it supports.

- self._wpr_file_to_story_names = data['archives']

- # Map from the story name to a relative path (as it appears

- # in the metadata file) of the .wpr file.

- self._story_name_to_wpr_file = dict()

- # Find out the wpr file names for each story.

- for wpr_file in data['archives']:

- story_names = data['archives'][wpr_file]

- for story_name in story_names:

- self._story_name_to_wpr_file[story_name] = wpr_file

- self.temp_target_wpr_file_path = None

+ assert data.get('platform_specific', False), (

+ 'archive_info2.WprArchiveInfo is exclusively for platform specific WPR '

+ 'archives. Platform agnostic archives should use '

+ 'archive_info.WprArchiveInfo archive_info2 will become archive_info '

+ 'once all data files are switched.')

+ self._story_name_to_wpr_file = data['archives']

@classmethod

def FromFile(cls, file_path, bucket):

+ """Generates a WprArchiveInfo instance from the given JSON file."""

if os.path.exists(file_path):

with open(file_path, 'r') as f:

data = json.load(f)

return cls(file_path, data, bucket)

return cls(file_path, {'archives': {}}, bucket)

- def DownloadArchivesIfNeeded(self):

+ def DownloadArchivesIfNeeded(self, target_platforms=None):

"""Downloads archives iff the Archive has a bucket parameter and the user

has permission to access the bucket.

@@ -71,23 +70,28 @@ class WprArchiveInfo(object):

permission to access the archive's bucket but a local copy of the archive

exists.

"""

+ # If no target platform is set, download all platforms.

+ if target_platforms is None:

+ target_platforms = _ALL_PLATFORMS

+ else:

+ assert isinstance(target_platforms, list), 'Must pass platforms as a list'

+ target_platforms = target_platforms + [_DEFAULT_PLATFORM]

# Download all .wpr files.

if not self._bucket:

logging.warning('Story set in %s has no bucket specified, and '

'cannot be downloaded from cloud_storage.', )

return

- assert 'archives' in self._data, 'Invalid data format in %s. \'archives\'' \

- ' field is needed' % self._file_path

- for archive_path in self._data['archives']:

- archive_path = self._WprFileNameToPath(archive_path)

+ assert 'archives' in self._data, ("Invalid data format in %s. 'archives' "

+ "field is needed" % self._file_path)

+ def download_if_needed(path):

try:

- cloud_storage.GetIfChanged(archive_path, self._bucket)

+ cloud_storage.GetIfChanged(path, self._bucket)

except (cloud_storage.CredentialsError, cloud_storage.PermissionError):

- if os.path.exists(archive_path):

- # If the archive exists, assume the user recorded their own and

- # simply warn.

- logging.warning('Need credentials to update WPR archive: %s',

- archive_path)

+ if os.path.exists(path):

+ # If the archive exists, assume the user recorded their own and warn

+ # them that they do not have the proper credentials to download.

+ logging.warning('Need credentials to update WPR archive: %s', path)

else:

logging.error("You either aren't authenticated or don't have "

"permission to use the archives for this page set."

@@ -97,16 +101,27 @@ class WprArchiveInfo(object):

"upload_to_cloud_storage")

raise

- def WprFilePathForStory(self, story):

+ story_archives = self._data['archives']

+ for story in story_archives:

+ for target_platform in target_platforms:

+ if story_archives[story].get(target_platform):

+ archive_path = self._WprFileNameToPath(

+ story_archives[story][target_platform])

+ download_if_needed(archive_path)

+ def WprFilePathForStory(self, story, target_platform=_DEFAULT_PLATFORM):

if self.temp_target_wpr_file_path:

return self.temp_target_wpr_file_path

wpr_file = self._story_name_to_wpr_file.get(story.display_name, None)

if wpr_file is None and hasattr(story, 'url'):

# Some old pages always use the URL to identify a page rather than the

# display_name, so try to look for that.

wpr_file = self._story_name_to_wpr_file.get(story.url, None)

if wpr_file:

- return self._WprFileNameToPath(wpr_file)

+ if target_platform in wpr_file:

+ return self._WprFileNameToPath(wpr_file[target_platform])

+ return self._WprFileNameToPath(wpr_file[_DEFAULT_PLATFORM])

return None

def AddNewTemporaryRecording(self, temp_wpr_file_path=None):

@@ -115,14 +130,17 @@ class WprArchiveInfo(object):

os.close(temp_wpr_file_handle)

self.temp_target_wpr_file_path = temp_wpr_file_path

- def AddRecordedStories(self, stories, upload_to_cloud_storage=False):

+ def AddRecordedStories(self, stories, upload_to_cloud_storage=False,

+ target_platform=_DEFAULT_PLATFORM):

if not stories:

os.remove(self.temp_target_wpr_file_path)

return

(target_wpr_file, target_wpr_file_path) = self._NextWprFileName()

for story in stories:

- self._SetWprFileForStory(story.display_name, target_wpr_file)

+ # Check to see if the platform has been manually overridden.

+ self._SetWprFileForStory(

+ story.display_name, target_wpr_file, target_platform)

shutil.move(self.temp_target_wpr_file_path, target_wpr_file_path)

# Update the hash file.

@@ -132,7 +150,6 @@ class WprArchiveInfo(object):

f.flush()

self._WriteToFile()

- self._DeleteAbandonedWprFiles()

# Upload to cloud storage

if upload_to_cloud_storage:

@@ -147,38 +164,14 @@ class WprArchiveInfo(object):

logging.warning('Failed to upload wpr file %s to cloud storage. '

'Error:%s' % target_wpr_file_path, e)

- def _DeleteAbandonedWprFiles(self):

- # Update the metadata so that the abandoned wpr files don't have

- # empty story name arrays.

- abandoned_wpr_files = self._AbandonedWprFiles()

- for wpr_file in abandoned_wpr_files:

- del self._wpr_file_to_story_names[wpr_file]

- # Don't fail if we're unable to delete some of the files.

- wpr_file_path = self._WprFileNameToPath(wpr_file)

- try:

- os.remove(wpr_file_path)

- except Exception:

- logging.warning('Failed to delete file: %s' % wpr_file_path)

- def _AbandonedWprFiles(self):

- abandoned_wpr_files = []

- for wpr_file, story_names in (

- self._wpr_file_to_story_names.iteritems()):

- if not story_names:

- abandoned_wpr_files.append(wpr_file)

- return abandoned_wpr_files

def _WriteToFile(self):

"""Writes the metadata into the file passed as constructor parameter."""

metadata = dict()

metadata['description'] = (

'Describes the Web Page Replay archives for a story set. '

'Don\'t edit by hand! Use record_wpr for updating.')

- metadata['archives'] = self._wpr_file_to_story_names.copy()

- # Don't write data for abandoned archives.

- abandoned_wpr_files = self._AbandonedWprFiles()

- for wpr_file in abandoned_wpr_files:

- del metadata['archives'][wpr_file]

+ metadata['archives'] = self._story_name_to_wpr_file.copy()

+ metadata['platform_specific'] = True

with open(self._file_path, 'w') as f:

json.dump(metadata, f, indent=4, sort_keys=True, separators=(',', ': '))

@@ -192,7 +185,12 @@ class WprArchiveInfo(object):

# The names are of the format "some_thing_number.wpr". Read the numbers.

highest_number = -1

base = None

- for wpr_file in self._wpr_file_to_story_names:

+ wpr_files = []

+ for story in self._data['archives']:

+ for p in self._data['archives'][story]:

+ wpr_files.append(self._data['archives'][story][p])

+ for wpr_file in wpr_files:

match = re.match(r'(?P<BASE>.*)_(?P<NUMBER>[0-9]+)\.wpr', wpr_file)

if not match:

raise Exception('Illegal wpr file name ' + wpr_file)

@@ -208,12 +206,10 @@ class WprArchiveInfo(object):

new_filename = '%s_%03d.wpr' % (base, highest_number + 1)

return new_filename, self._WprFileNameToPath(new_filename)

- def _SetWprFileForStory(self, story_name, wpr_file):

+ def _SetWprFileForStory(self, story_name, wpr_file, target_platform):

"""For modifying the metadata when we're going to record a new archive."""

- old_wpr_file = self._story_name_to_wpr_file.get(story_name, None)

- if old_wpr_file:

- self._wpr_file_to_story_names[old_wpr_file].remove(story_name)

- self._story_name_to_wpr_file[story_name] = wpr_file

- if wpr_file not in self._wpr_file_to_story_names:

- self._wpr_file_to_story_names[wpr_file] = []

- self._wpr_file_to_story_names[wpr_file].append(story_name)

+ if story_name not in self._data['archives']:

+ # If there is no other recording we want the first to be the default

+ # until a new default is recorded.

+ self._data['archives'][story_name] = {_DEFAULT_PLATFORM: wpr_file}

+ self._data['archives'][story_name][target_platform] = wpr_file

« no previous file with comments | « telemetry/telemetry/wpr/archive_info.py ('k') | telemetry/telemetry/wpr/archive_info2_unittest.py » ('j') | no next file with comments »