Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(3020)

Side by Side Diff: tests/download_from_google_storage_unittests.py

Issue 12042069: Scripts to download files from google storage based on sha1 sums (Closed) Base URL: https://chromium.googlesource.com/chromium/tools/depot_tools.git@master
Patch Set: Updated messages, switched main thread to use stdout_queue Created 7 years, 9 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
(Empty)
1 #!/usr/bin/env python
2 # Copyright (c) 2012 The Chromium Authors. All rights reserved.
3 # Use of this source code is governed by a BSD-style license that can be
4 # found in the LICENSE file.
5
6 """Unit tests for download_from_google_storage.py."""
7
8 import os
9 import sys
10 import unittest
11 import threading
12 import Queue
13 import optparse
14
15 sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
16
17 import upload_to_google_storage
18 import download_from_google_storage
19
20 # ../third_party/gsutil/gsutil
21 GSUTIL_DEFAULT_PATH = os.path.join(
22 os.path.dirname(os.path.dirname(os.path.abspath(__file__))),
23 'third_party', 'gsutil', 'gsutil')
24
25
26 class GsutilMock(object):
27 def __init__(self, path, boto_path=None, timeout=None):
28 self.path = path
29 self.timeout = timeout
30 self.boto_path = boto_path
31 self.expected = []
32 self.history = []
33 self.lock = threading.Lock()
34
35 def add_expected(self, return_code, out, err):
36 self.expected.append((return_code, out, err))
37
38 def append_history(self, method, args):
39 self.history.append((method, args))
40
41 def call(self, *args):
42 with self.lock:
43 self.append_history('call', args)
44 if self.expected:
45 return self.expected.pop(0)[0]
46 else:
47 return 0
48
49 def check_call(self, *args):
50 with self.lock:
51 self.append_history('check_call', args)
52 if self.expected:
53 return self.expected.pop(0)
54 else:
55 return (0, '', '')
M-A Ruel 2013/03/11 19:52:01 Interesting, usually I keep a reference to the Tes
56
57
58 class GstoolsUnitTests(unittest.TestCase):
59 def setUp(self):
60 self.base_path = os.path.join(
61 os.path.dirname(os.path.abspath(__file__)), 'gstools')
62
63 def test_gsutil(self):
64 gsutil = download_from_google_storage.Gsutil(GSUTIL_DEFAULT_PATH)
65 self.assertEquals(gsutil.path, GSUTIL_DEFAULT_PATH)
M-A Ruel 2013/03/11 19:52:01 Please use assertEqual() for new code, as per: htt
Ryan Tseng 2013/03/11 21:34:19 Done.
66 code, _, err = gsutil.check_call()
67 self.assertEquals(code, 0)
68 self.assertEquals(err, '')
69
70 def test_gsutil_version(self):
71 gsutil = download_from_google_storage.Gsutil(GSUTIL_DEFAULT_PATH)
72 _, _, err = gsutil.check_call('version')
73 err_lines = err.splitlines()
74 self.assertEquals(err_lines[0], 'gsutil version 3.25')
75 self.assertEquals(
76 err_lines[1],
77 'checksum ce71ac982f1148315e7fa65cff2f83e8 (OK)')
78
79 def test_get_sha1(self):
80 lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt')
81 self.assertEquals(
82 download_from_google_storage.get_sha1(lorem_ipsum),
83 '7871c8e24da15bad8b0be2c36edc9dc77e37727f')
84
85 def test_get_md5(self):
86 lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt')
87 self.assertEquals(
88 upload_to_google_storage.get_md5(lorem_ipsum),
89 '634d7c1ed3545383837428f031840a1e')
90
91 def test_get_md5_cached_read(self):
92 lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt')
93 # Use a fake 'stale' MD5 sum. Expected behavior is to return stale sum.
94 self.assertEquals(
95 upload_to_google_storage.get_md5_cached(lorem_ipsum),
96 '734d7c1ed3545383837428f031840a1e')
97
98 def test_get_md5_cached_write(self):
99 lorem_ipsum2 = os.path.join(self.base_path, 'lorem_ipsum2.txt')
100 lorem_ipsum2_md5 = os.path.join(self.base_path, 'lorem_ipsum2.txt.md5')
101 if os.path.exists(lorem_ipsum2_md5):
102 os.remove(lorem_ipsum2_md5)
M-A Ruel 2013/03/11 19:52:01 Then use a temporary directory so no files are lea
Ryan Tseng 2013/03/11 21:34:19 Done.
103 # Use a fake 'stale' MD5 sum. Expected behavior is to return stale sum.
104 self.assertEquals(
105 upload_to_google_storage.get_md5_cached(lorem_ipsum2),
106 '4c02d1eb455a0f22c575265d17b84b6d')
107 self.assertTrue(os.path.exists(lorem_ipsum2_md5))
108 self.assertEquals(
109 open(lorem_ipsum2_md5, 'rb').read(),
110 '4c02d1eb455a0f22c575265d17b84b6d')
111 os.remove(lorem_ipsum2_md5) # Clean up.
112 self.assertFalse(os.path.exists(lorem_ipsum2_md5))
113
114
115 class DownloadTests(unittest.TestCase):
116 def setUp(self):
117 self.gsutil = GsutilMock(GSUTIL_DEFAULT_PATH)
118 self.base_path = os.path.join(
119 os.path.dirname(os.path.abspath(__file__)),
M-A Ruel 2013/03/11 19:52:01 Use a file-level variable. This code would break i
Ryan Tseng 2013/03/11 21:34:19 Done.
120 'gstools',
121 'download_test_data')
122 self.base_url = 'gs://sometesturl'
123 self.parser = optparse.OptionParser()
124 self.queue = Queue.Queue()
125 self.ret_codes = Queue.Queue()
126 self.lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt')
127 self.lorem_ipsum_sha1 = '7871c8e24da15bad8b0be2c36edc9dc77e37727f'
128 self.maxDiff = None
129
130 def test_enumerate_files_non_recursive(self):
131 queue_size = download_from_google_storage.enumerate_work_queue(
132 self.base_path, self.queue, True, False, False, None, False)
133 result = list(self.queue.queue)
134 expected_queue = [
135 ('e6c4fbd4fe7607f3e6ebf68b2ea4ef694da7b4fe',
136 os.path.join(self.base_path, 'rootfolder_text.txt')),
137 ('7871c8e24da15bad8b0be2c36edc9dc77e37727f',
138 os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt'))]
139 for item in result:
140 self.assertTrue(item in expected_queue)
141 self.assertEquals(queue_size, 2)
142
143 def test_enumerate_files_recursive(self):
144 queue_size = download_from_google_storage.enumerate_work_queue(
145 self.base_path, self.queue, True, True, False, None, False)
146 expected_queue = [
147 ('e6c4fbd4fe7607f3e6ebf68b2ea4ef694da7b4fe',
148 os.path.join(self.base_path, 'rootfolder_text.txt')),
149 ('7871c8e24da15bad8b0be2c36edc9dc77e37727f',
150 os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt')),
151 ('b5415aa0b64006a95c0c409182e628881d6d6463',
152 os.path.join(self.base_path, 'subfolder', 'subfolder_text.txt'))]
153 result = list(self.queue.queue)
M-A Ruel 2013/03/11 19:52:01 self.assertEqual(sorted(expected_queue), sorted(se
Ryan Tseng 2013/03/11 21:34:19 Done. Keeping the queue_size check since its calc
154 for item in result:
155 self.assertTrue(item in expected_queue)
156 self.assertEquals(queue_size, 3)
157
158 def test_download_worker_single_file(self):
159 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f'
160 input_filename = '%s/%s' % (self.base_url, sha1_hash)
161 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt')
162 self.queue.put((sha1_hash, output_filename))
163 self.queue.put((None, None))
164 stdout_queue = Queue.Queue()
165 # pylint: disable=W0212
M-A Ruel 2013/03/11 19:52:01 You can disable it at file level. It'll save a few
Ryan Tseng 2013/03/11 21:34:19 Done.
166 download_from_google_storage._downloader_worker_thread(
167 0, self.queue, False, self.base_url, self.gsutil,
168 stdout_queue, self.ret_codes)
169 expected_calls = [
170 ('check_call',
171 ('ls', input_filename)),
172 ('check_call',
173 ('cp', '-q', input_filename, output_filename))]
174 expected_output = [
175 '0> Downloading %s...' % output_filename]
176 expected_ret_codes = []
177 self.assertEquals(list(stdout_queue.queue), expected_output)
178 self.assertEquals(self.gsutil.history, expected_calls)
179 self.assertEquals(list(self.ret_codes.queue), expected_ret_codes)
180
181 def test_download_worker_skips_file(self):
182 sha1_hash = 'e6c4fbd4fe7607f3e6ebf68b2ea4ef694da7b4fe'
183 output_filename = os.path.join(self.base_path, 'rootfolder_text.txt')
184 self.queue.put((sha1_hash, output_filename))
185 self.queue.put((None, None))
186 stdout_queue = Queue.Queue()
187 # pylint: disable=W0212
188 download_from_google_storage._downloader_worker_thread(
189 0, self.queue, False, self.base_url, self.gsutil,
190 stdout_queue, self.ret_codes)
191 expected_output = [
192 '0> File %s exists and SHA1 matches. Skipping.' % output_filename
193 ]
194 self.assertEquals(list(stdout_queue.queue), expected_output)
195 self.assertEquals(self.gsutil.history, [])
196
197 def test_download_worker_skips_not_found_file(self):
198 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f'
199 input_filename = '%s/%s' % (self.base_url, sha1_hash)
200 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt')
201 self.queue.put((sha1_hash, output_filename))
202 self.queue.put((None, None))
203 stdout_queue = Queue.Queue()
204 self.gsutil.add_expected(1, '', '') # Return error when 'ls' is called.
205 # pylint: disable=W0212
206 download_from_google_storage._downloader_worker_thread(
207 0, self.queue, False, self.base_url, self.gsutil,
208 stdout_queue, self.ret_codes)
209 expected_output = [
210 '0> File %s for %s does not exist, skipping.' % (
211 input_filename, output_filename),
212 ]
213 expected_calls = [
214 ('check_call',
215 ('ls', input_filename))
216 ]
217 expected_ret_codes = [
218 (1, 'File %s for %s does not exist.' % (
219 input_filename, output_filename))
220 ]
221 self.assertEquals(list(stdout_queue.queue), expected_output)
222 self.assertEquals(self.gsutil.history, expected_calls)
223 self.assertEquals(list(self.ret_codes.queue), expected_ret_codes)
224
225 def test_download_cp_fails(self):
226 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f'
227 input_filename = '%s/%s' % (self.base_url, sha1_hash)
228 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt')
229 self.gsutil.add_expected(0, '', '')
230 self.gsutil.add_expected(101, '', 'Test error message.')
231 # pylint: disable=W0212
232 code = download_from_google_storage.download_from_google_storage(
233 input_filename=sha1_hash,
234 base_url=self.base_url,
235 gsutil=self.gsutil,
236 num_threads=1,
237 directory=False,
238 recursive=False,
239 force=True,
240 output=output_filename,
241 ignore_errors=False,
242 sha1_file=False)
243 expected_calls = [
244 ('check_call',
245 ('ls', input_filename)),
246 ('check_call',
247 ('cp', '-q', input_filename, output_filename))
248 ]
249 self.assertEquals(self.gsutil.history, expected_calls)
250 self.assertEquals(code, 101)
251
252 def test_download_directory_no_recursive_non_force(self):
253 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f'
254 input_filename = '%s/%s' % (self.base_url, sha1_hash)
255 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt')
256 code = download_from_google_storage.download_from_google_storage(
257 input_filename=self.base_path,
258 base_url=self.base_url,
259 gsutil=self.gsutil,
260 num_threads=1,
261 directory=True,
262 recursive=False,
263 force=False,
264 output=None,
265 ignore_errors=False,
266 sha1_file=False)
267 expected_calls = [
268 ('check_call',
269 ('ls', input_filename)),
270 ('check_call',
271 ('cp', '-q', input_filename, output_filename))]
272 self.assertEquals(self.gsutil.history, expected_calls)
273 self.assertEquals(code, 0)
274
M-A Ruel 2013/03/11 19:52:01 2 lines
Ryan Tseng 2013/03/11 21:34:19 Done.
275 if __name__ == '__main__':
276 unittest.main()
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698