Index: third_party/gsutil/gslib/tests/test_resumable_streaming.py |
diff --git a/third_party/gsutil/gslib/tests/test_resumable_streaming.py b/third_party/gsutil/gslib/tests/test_resumable_streaming.py |
new file mode 100644 |
index 0000000000000000000000000000000000000000..51df48bbcc78d88ac397d4f63362591402c5b98d |
--- /dev/null |
+++ b/third_party/gsutil/gslib/tests/test_resumable_streaming.py |
@@ -0,0 +1,267 @@ |
+# -*- coding: utf-8 -*- |
+# Copyright 2014 Google Inc. All Rights Reserved. |
+# |
+# Licensed under the Apache License, Version 2.0 (the "License"); |
+# you may not use this file except in compliance with the License. |
+# You may obtain a copy of the License at |
+# |
+# http://www.apache.org/licenses/LICENSE-2.0 |
+# |
+# Unless required by applicable law or agreed to in writing, software |
+# distributed under the License is distributed on an "AS IS" BASIS, |
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
+# See the License for the specific language governing permissions and |
+# limitations under the License. |
+"""Unit tests for resumable streaming upload functions and classes.""" |
+ |
+from __future__ import absolute_import |
+ |
+from hashlib import md5 |
+import os |
+import pkgutil |
+ |
+from gslib.exception import CommandException |
+from gslib.hashing_helper import CalculateHashesFromContents |
+from gslib.hashing_helper import CalculateMd5FromContents |
+from gslib.resumable_streaming_upload import ResumableStreamingJsonUploadWrapper |
+import gslib.tests.testcase as testcase |
+from gslib.util import GetJsonResumableChunkSize |
+from gslib.util import TRANSFER_BUFFER_SIZE |
+ |
+ |
+_TEST_FILE = 'test.txt' |
+ |
+ |
+class TestResumableStreamingJsonUploadWrapper(testcase.GsUtilUnitTestCase): |
+ """Unit tests for the TestResumableStreamingJsonUploadWrapper class.""" |
+ |
+ _temp_test_file = None |
+ _temp_test_file_contents = None |
+ _temp_test_file_len = None |
+ |
+ def _GetTestFile(self): |
+ if not self._temp_test_file: |
+ self._temp_test_file_contents = pkgutil.get_data( |
+ 'gslib', 'tests/test_data/%s' % _TEST_FILE) |
+ self._temp_test_file = self.CreateTempFile( |
+ file_name=_TEST_FILE, contents=self._temp_test_file_contents) |
+ self._temp_test_file_len = len(self._temp_test_file_contents) |
+ return self._temp_test_file |
+ |
+ def testReadInChunks(self): |
+ tmp_file = self._GetTestFile() |
+ with open(tmp_file, 'rb') as stream: |
+ wrapper = ResumableStreamingJsonUploadWrapper( |
+ stream, TRANSFER_BUFFER_SIZE, test_small_buffer=True) |
+ hash_dict = {'md5': md5()} |
+ # CalculateHashesFromContents reads in chunks, but does not seek. |
+ CalculateHashesFromContents(wrapper, hash_dict) |
+ with open(tmp_file, 'rb') as stream: |
+ actual = CalculateMd5FromContents(stream) |
+ self.assertEqual(actual, hash_dict['md5'].hexdigest()) |
+ |
+ def testReadInChunksWithSeekToBeginning(self): |
+ """Reads one buffer, then seeks to 0 and reads chunks until the end.""" |
+ tmp_file = self._GetTestFile() |
+ for initial_read in (TRANSFER_BUFFER_SIZE - 1, |
+ TRANSFER_BUFFER_SIZE, |
+ TRANSFER_BUFFER_SIZE + 1, |
+ TRANSFER_BUFFER_SIZE * 2 - 1, |
+ TRANSFER_BUFFER_SIZE * 2, |
+ TRANSFER_BUFFER_SIZE * 2 + 1, |
+ TRANSFER_BUFFER_SIZE * 3 - 1, |
+ TRANSFER_BUFFER_SIZE * 3, |
+ TRANSFER_BUFFER_SIZE * 3 + 1): |
+ for buffer_size in (TRANSFER_BUFFER_SIZE - 1, |
+ TRANSFER_BUFFER_SIZE, |
+ TRANSFER_BUFFER_SIZE + 1, |
+ self._temp_test_file_len - 1, |
+ self._temp_test_file_len, |
+ self._temp_test_file_len + 1): |
+ # Can't seek to 0 if the buffer is too small, so we expect an |
+ # exception. |
+ expect_exception = buffer_size < self._temp_test_file_len |
+ with open(tmp_file, 'rb') as stream: |
+ wrapper = ResumableStreamingJsonUploadWrapper( |
+ stream, buffer_size, test_small_buffer=True) |
+ wrapper.read(initial_read) |
+ # CalculateMd5FromContents seeks to 0, reads in chunks, then seeks |
+ # to 0 again. |
+ try: |
+ hex_digest = CalculateMd5FromContents(wrapper) |
+ if expect_exception: |
+ self.fail('Did not get expected CommandException for ' |
+ 'initial read size %s, buffer size %s' % |
+ (initial_read, buffer_size)) |
+ except CommandException, e: |
+ if not expect_exception: |
+ self.fail('Got unexpected CommandException "%s" for ' |
+ 'initial read size %s, buffer size %s' % |
+ (str(e), initial_read, buffer_size)) |
+ if not expect_exception: |
+ with open(tmp_file, 'rb') as stream: |
+ actual = CalculateMd5FromContents(stream) |
+ self.assertEqual( |
+ actual, hex_digest, |
+ 'Digests not equal for initial read size %s, buffer size %s' % |
+ (initial_read, buffer_size)) |
+ |
+ def _testSeekBack(self, initial_reads, buffer_size, seek_back_amount): |
+ """Tests reading then seeking backwards. |
+ |
+ This function simulates an upload that is resumed after a connection break. |
+ It reads one transfer buffer at a time until it reaches initial_position, |
+ then seeks backwards (as if the server did not receive some of the bytes) |
+ and reads to the end of the file, ensuring the data read after the seek |
+ matches the original file. |
+ |
+ Args: |
+ initial_reads: List of integers containing read sizes to perform |
+ before seek. |
+ buffer_size: Maximum buffer size for the wrapper. |
+ seek_back_amount: Number of bytes to seek backward. |
+ |
+ Raises: |
+ AssertionError on wrong data returned by the wrapper. |
+ """ |
+ tmp_file = self._GetTestFile() |
+ initial_position = 0 |
+ for read_size in initial_reads: |
+ initial_position += read_size |
+ self.assertGreaterEqual( |
+ buffer_size, seek_back_amount, |
+ 'seek_back_amount must be less than initial position %s ' |
+ '(but was actually: %s)' % (buffer_size, seek_back_amount)) |
+ self.assertLess( |
+ initial_position, self._temp_test_file_len, |
+ 'initial_position must be less than test file size %s ' |
+ '(but was actually: %s)' % (self._temp_test_file_len, initial_position)) |
+ |
+ with open(tmp_file, 'rb') as stream: |
+ wrapper = ResumableStreamingJsonUploadWrapper( |
+ stream, buffer_size, test_small_buffer=True) |
+ position = 0 |
+ for read_size in initial_reads: |
+ data = wrapper.read(read_size) |
+ self.assertEqual( |
+ self._temp_test_file_contents[position:position + read_size], |
+ data, 'Data from position %s to %s did not match file contents.' % |
+ (position, position + read_size)) |
+ position += len(data) |
+ wrapper.seek(initial_position - seek_back_amount) |
+ self.assertEqual(wrapper.tell(), |
+ initial_position - seek_back_amount) |
+ data = wrapper.read() |
+ self.assertEqual( |
+ self._temp_test_file_len - (initial_position - seek_back_amount), |
+ len(data), |
+ 'Unexpected data length with initial pos %s seek_back_amount %s. ' |
+ 'Expected: %s, actual: %s.' % |
+ (initial_position, seek_back_amount, |
+ self._temp_test_file_len - (initial_position - seek_back_amount), |
+ len(data))) |
+ self.assertEqual( |
+ self._temp_test_file_contents[-len(data):], data, |
+ 'Data from position %s to EOF did not match file contents.' % |
+ position) |
+ |
+ def testReadSeekAndReadToEOF(self): |
+ """Tests performing reads on the wrapper, seeking, then reading to EOF.""" |
+ for initial_reads in ([1], |
+ [TRANSFER_BUFFER_SIZE - 1], |
+ [TRANSFER_BUFFER_SIZE], |
+ [TRANSFER_BUFFER_SIZE + 1], |
+ [1, TRANSFER_BUFFER_SIZE - 1], |
+ [1, TRANSFER_BUFFER_SIZE], |
+ [1, TRANSFER_BUFFER_SIZE + 1], |
+ [TRANSFER_BUFFER_SIZE - 1, 1], |
+ [TRANSFER_BUFFER_SIZE, 1], |
+ [TRANSFER_BUFFER_SIZE + 1, 1], |
+ [TRANSFER_BUFFER_SIZE - 1, TRANSFER_BUFFER_SIZE - 1], |
+ [TRANSFER_BUFFER_SIZE - 1, TRANSFER_BUFFER_SIZE], |
+ [TRANSFER_BUFFER_SIZE - 1, TRANSFER_BUFFER_SIZE + 1], |
+ [TRANSFER_BUFFER_SIZE, TRANSFER_BUFFER_SIZE - 1], |
+ [TRANSFER_BUFFER_SIZE, TRANSFER_BUFFER_SIZE], |
+ [TRANSFER_BUFFER_SIZE, TRANSFER_BUFFER_SIZE + 1], |
+ [TRANSFER_BUFFER_SIZE + 1, TRANSFER_BUFFER_SIZE - 1], |
+ [TRANSFER_BUFFER_SIZE + 1, TRANSFER_BUFFER_SIZE], |
+ [TRANSFER_BUFFER_SIZE + 1, TRANSFER_BUFFER_SIZE + 1], |
+ [TRANSFER_BUFFER_SIZE, TRANSFER_BUFFER_SIZE, |
+ TRANSFER_BUFFER_SIZE]): |
+ initial_position = 0 |
+ for read_size in initial_reads: |
+ initial_position += read_size |
+ for buffer_size in (initial_position, |
+ initial_position + 1, |
+ initial_position * 2 - 1, |
+ initial_position * 2): |
+ for seek_back_amount in ( |
+ min(TRANSFER_BUFFER_SIZE - 1, initial_position), |
+ min(TRANSFER_BUFFER_SIZE, initial_position), |
+ min(TRANSFER_BUFFER_SIZE + 1, initial_position), |
+ min(TRANSFER_BUFFER_SIZE * 2 - 1, initial_position), |
+ min(TRANSFER_BUFFER_SIZE * 2, initial_position), |
+ min(TRANSFER_BUFFER_SIZE * 2 + 1, initial_position)): |
+ self._testSeekBack(initial_reads, buffer_size, seek_back_amount) |
+ |
+ def testBufferSizeLessThanChunkSize(self): |
+ ResumableStreamingJsonUploadWrapper(None, GetJsonResumableChunkSize()) |
+ try: |
+ ResumableStreamingJsonUploadWrapper(None, GetJsonResumableChunkSize() - 1) |
+ self.fail('Did not get expected CommandException') |
+ except CommandException, e: |
+ self.assertIn('Buffer size must be >= JSON resumable upload', str(e)) |
+ |
+ def testSeekPartialBuffer(self): |
+ """Tests seeking back partially within the buffer.""" |
+ tmp_file = self._GetTestFile() |
+ read_size = TRANSFER_BUFFER_SIZE |
+ with open(tmp_file, 'rb') as stream: |
+ wrapper = ResumableStreamingJsonUploadWrapper( |
+ stream, TRANSFER_BUFFER_SIZE * 3, test_small_buffer=True) |
+ position = 0 |
+ for _ in xrange(3): |
+ data = wrapper.read(read_size) |
+ self.assertEqual( |
+ self._temp_test_file_contents[position:position + read_size], |
+ data, 'Data from position %s to %s did not match file contents.' % |
+ (position, position + read_size)) |
+ position += len(data) |
+ |
+ data = wrapper.read(read_size / 2) |
+ # Buffer contents should now be have contents from: |
+ # read_size/2 through 7*read_size/2. |
+ position = read_size / 2 |
+ wrapper.seek(position) |
+ data = wrapper.read() |
+ self.assertEqual( |
+ self._temp_test_file_contents[-len(data):], data, |
+ 'Data from position %s to EOF did not match file contents.' % |
+ position) |
+ |
+ def testSeekEnd(self): |
+ tmp_file = self._GetTestFile() |
+ for buffer_size in (TRANSFER_BUFFER_SIZE - 1, |
+ TRANSFER_BUFFER_SIZE, |
+ TRANSFER_BUFFER_SIZE + 1): |
+ for seek_back in (TRANSFER_BUFFER_SIZE - 1, |
+ TRANSFER_BUFFER_SIZE, |
+ TRANSFER_BUFFER_SIZE + 1): |
+ expect_exception = seek_back > buffer_size |
+ with open(tmp_file, 'rb') as stream: |
+ wrapper = ResumableStreamingJsonUploadWrapper( |
+ stream, buffer_size, test_small_buffer=True) |
+ # Read to the end. |
+ while wrapper.read(TRANSFER_BUFFER_SIZE): |
+ pass |
+ try: |
+ wrapper.seek(seek_back, whence=os.SEEK_END) |
+ if expect_exception: |
+ self.fail('Did not get expected CommandException for ' |
+ 'seek_back size %s, buffer size %s' % |
+ (seek_back, buffer_size)) |
+ except CommandException, e: |
+ if not expect_exception: |
+ self.fail('Got unexpected CommandException "%s" for ' |
+ 'seek_back size %s, buffer size %s' % |
+ (str(e), seek_back, buffer_size)) |