OLD | NEW |
---|---|
(Empty) | |
1 #!/usr/bin/env python | |
2 # Copyright (c) 2012 The Chromium Authors. All rights reserved. | |
3 # Use of this source code is governed by a BSD-style license that can be | |
4 # found in the LICENSE file. | |
5 | |
6 """Unit tests for download_from_google_storage.py.""" | |
7 | |
8 import os | |
9 import sys | |
10 import unittest | |
11 import threading | |
12 import Queue | |
13 import optparse | |
14 | |
15 sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__)))) | |
16 | |
17 import upload_to_google_storage | |
18 import download_from_google_storage | |
19 | |
20 # ../third_party/gsutil/gsutil | |
21 GSUTIL_DEFAULT_PATH = os.path.join( | |
22 os.path.dirname(os.path.dirname(os.path.abspath(__file__))), | |
23 'third_party', 'gsutil', 'gsutil') | |
24 | |
25 | |
26 class GsutilMock(object): | |
27 def __init__(self, path, boto_path=None, timeout=None): | |
28 self.path = path | |
29 self.timeout = timeout | |
30 self.boto_path = boto_path | |
31 self.expected = [] | |
32 self.history = [] | |
33 self.lock = threading.Lock() | |
34 | |
35 def add_expected(self, return_code, out, err): | |
36 self.expected.append((return_code, out, err)) | |
37 | |
38 def append_history(self, method, args): | |
39 self.history.append((method, args)) | |
40 | |
41 def call(self, *args): | |
42 with self.lock: | |
43 self.append_history('call', args) | |
44 if self.expected: | |
45 return self.expected.pop(0)[0] | |
46 else: | |
47 return 0 | |
48 | |
49 def check_call(self, *args): | |
50 with self.lock: | |
51 self.append_history('check_call', args) | |
52 if self.expected: | |
53 return self.expected.pop(0) | |
54 else: | |
55 return (0, '', '') | |
M-A Ruel
2013/03/11 19:52:01
Interesting, usually I keep a reference to the Tes
| |
56 | |
57 | |
58 class GstoolsUnitTests(unittest.TestCase): | |
59 def setUp(self): | |
60 self.base_path = os.path.join( | |
61 os.path.dirname(os.path.abspath(__file__)), 'gstools') | |
62 | |
63 def test_gsutil(self): | |
64 gsutil = download_from_google_storage.Gsutil(GSUTIL_DEFAULT_PATH) | |
65 self.assertEquals(gsutil.path, GSUTIL_DEFAULT_PATH) | |
M-A Ruel
2013/03/11 19:52:01
Please use assertEqual() for new code, as per:
htt
Ryan Tseng
2013/03/11 21:34:19
Done.
| |
66 code, _, err = gsutil.check_call() | |
67 self.assertEquals(code, 0) | |
68 self.assertEquals(err, '') | |
69 | |
70 def test_gsutil_version(self): | |
71 gsutil = download_from_google_storage.Gsutil(GSUTIL_DEFAULT_PATH) | |
72 _, _, err = gsutil.check_call('version') | |
73 err_lines = err.splitlines() | |
74 self.assertEquals(err_lines[0], 'gsutil version 3.25') | |
75 self.assertEquals( | |
76 err_lines[1], | |
77 'checksum ce71ac982f1148315e7fa65cff2f83e8 (OK)') | |
78 | |
79 def test_get_sha1(self): | |
80 lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt') | |
81 self.assertEquals( | |
82 download_from_google_storage.get_sha1(lorem_ipsum), | |
83 '7871c8e24da15bad8b0be2c36edc9dc77e37727f') | |
84 | |
85 def test_get_md5(self): | |
86 lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt') | |
87 self.assertEquals( | |
88 upload_to_google_storage.get_md5(lorem_ipsum), | |
89 '634d7c1ed3545383837428f031840a1e') | |
90 | |
91 def test_get_md5_cached_read(self): | |
92 lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt') | |
93 # Use a fake 'stale' MD5 sum. Expected behavior is to return stale sum. | |
94 self.assertEquals( | |
95 upload_to_google_storage.get_md5_cached(lorem_ipsum), | |
96 '734d7c1ed3545383837428f031840a1e') | |
97 | |
98 def test_get_md5_cached_write(self): | |
99 lorem_ipsum2 = os.path.join(self.base_path, 'lorem_ipsum2.txt') | |
100 lorem_ipsum2_md5 = os.path.join(self.base_path, 'lorem_ipsum2.txt.md5') | |
101 if os.path.exists(lorem_ipsum2_md5): | |
102 os.remove(lorem_ipsum2_md5) | |
M-A Ruel
2013/03/11 19:52:01
Then use a temporary directory so no files are lea
Ryan Tseng
2013/03/11 21:34:19
Done.
| |
103 # Use a fake 'stale' MD5 sum. Expected behavior is to return stale sum. | |
104 self.assertEquals( | |
105 upload_to_google_storage.get_md5_cached(lorem_ipsum2), | |
106 '4c02d1eb455a0f22c575265d17b84b6d') | |
107 self.assertTrue(os.path.exists(lorem_ipsum2_md5)) | |
108 self.assertEquals( | |
109 open(lorem_ipsum2_md5, 'rb').read(), | |
110 '4c02d1eb455a0f22c575265d17b84b6d') | |
111 os.remove(lorem_ipsum2_md5) # Clean up. | |
112 self.assertFalse(os.path.exists(lorem_ipsum2_md5)) | |
113 | |
114 | |
115 class DownloadTests(unittest.TestCase): | |
116 def setUp(self): | |
117 self.gsutil = GsutilMock(GSUTIL_DEFAULT_PATH) | |
118 self.base_path = os.path.join( | |
119 os.path.dirname(os.path.abspath(__file__)), | |
M-A Ruel
2013/03/11 19:52:01
Use a file-level variable. This code would break i
Ryan Tseng
2013/03/11 21:34:19
Done.
| |
120 'gstools', | |
121 'download_test_data') | |
122 self.base_url = 'gs://sometesturl' | |
123 self.parser = optparse.OptionParser() | |
124 self.queue = Queue.Queue() | |
125 self.ret_codes = Queue.Queue() | |
126 self.lorem_ipsum = os.path.join(self.base_path, 'lorem_ipsum.txt') | |
127 self.lorem_ipsum_sha1 = '7871c8e24da15bad8b0be2c36edc9dc77e37727f' | |
128 self.maxDiff = None | |
129 | |
130 def test_enumerate_files_non_recursive(self): | |
131 queue_size = download_from_google_storage.enumerate_work_queue( | |
132 self.base_path, self.queue, True, False, False, None, False) | |
133 result = list(self.queue.queue) | |
134 expected_queue = [ | |
135 ('e6c4fbd4fe7607f3e6ebf68b2ea4ef694da7b4fe', | |
136 os.path.join(self.base_path, 'rootfolder_text.txt')), | |
137 ('7871c8e24da15bad8b0be2c36edc9dc77e37727f', | |
138 os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt'))] | |
139 for item in result: | |
140 self.assertTrue(item in expected_queue) | |
141 self.assertEquals(queue_size, 2) | |
142 | |
143 def test_enumerate_files_recursive(self): | |
144 queue_size = download_from_google_storage.enumerate_work_queue( | |
145 self.base_path, self.queue, True, True, False, None, False) | |
146 expected_queue = [ | |
147 ('e6c4fbd4fe7607f3e6ebf68b2ea4ef694da7b4fe', | |
148 os.path.join(self.base_path, 'rootfolder_text.txt')), | |
149 ('7871c8e24da15bad8b0be2c36edc9dc77e37727f', | |
150 os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt')), | |
151 ('b5415aa0b64006a95c0c409182e628881d6d6463', | |
152 os.path.join(self.base_path, 'subfolder', 'subfolder_text.txt'))] | |
153 result = list(self.queue.queue) | |
M-A Ruel
2013/03/11 19:52:01
self.assertEqual(sorted(expected_queue), sorted(se
Ryan Tseng
2013/03/11 21:34:19
Done. Keeping the queue_size check since its calc
| |
154 for item in result: | |
155 self.assertTrue(item in expected_queue) | |
156 self.assertEquals(queue_size, 3) | |
157 | |
158 def test_download_worker_single_file(self): | |
159 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f' | |
160 input_filename = '%s/%s' % (self.base_url, sha1_hash) | |
161 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt') | |
162 self.queue.put((sha1_hash, output_filename)) | |
163 self.queue.put((None, None)) | |
164 stdout_queue = Queue.Queue() | |
165 # pylint: disable=W0212 | |
M-A Ruel
2013/03/11 19:52:01
You can disable it at file level. It'll save a few
Ryan Tseng
2013/03/11 21:34:19
Done.
| |
166 download_from_google_storage._downloader_worker_thread( | |
167 0, self.queue, False, self.base_url, self.gsutil, | |
168 stdout_queue, self.ret_codes) | |
169 expected_calls = [ | |
170 ('check_call', | |
171 ('ls', input_filename)), | |
172 ('check_call', | |
173 ('cp', '-q', input_filename, output_filename))] | |
174 expected_output = [ | |
175 '0> Downloading %s...' % output_filename] | |
176 expected_ret_codes = [] | |
177 self.assertEquals(list(stdout_queue.queue), expected_output) | |
178 self.assertEquals(self.gsutil.history, expected_calls) | |
179 self.assertEquals(list(self.ret_codes.queue), expected_ret_codes) | |
180 | |
181 def test_download_worker_skips_file(self): | |
182 sha1_hash = 'e6c4fbd4fe7607f3e6ebf68b2ea4ef694da7b4fe' | |
183 output_filename = os.path.join(self.base_path, 'rootfolder_text.txt') | |
184 self.queue.put((sha1_hash, output_filename)) | |
185 self.queue.put((None, None)) | |
186 stdout_queue = Queue.Queue() | |
187 # pylint: disable=W0212 | |
188 download_from_google_storage._downloader_worker_thread( | |
189 0, self.queue, False, self.base_url, self.gsutil, | |
190 stdout_queue, self.ret_codes) | |
191 expected_output = [ | |
192 '0> File %s exists and SHA1 matches. Skipping.' % output_filename | |
193 ] | |
194 self.assertEquals(list(stdout_queue.queue), expected_output) | |
195 self.assertEquals(self.gsutil.history, []) | |
196 | |
197 def test_download_worker_skips_not_found_file(self): | |
198 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f' | |
199 input_filename = '%s/%s' % (self.base_url, sha1_hash) | |
200 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt') | |
201 self.queue.put((sha1_hash, output_filename)) | |
202 self.queue.put((None, None)) | |
203 stdout_queue = Queue.Queue() | |
204 self.gsutil.add_expected(1, '', '') # Return error when 'ls' is called. | |
205 # pylint: disable=W0212 | |
206 download_from_google_storage._downloader_worker_thread( | |
207 0, self.queue, False, self.base_url, self.gsutil, | |
208 stdout_queue, self.ret_codes) | |
209 expected_output = [ | |
210 '0> File %s for %s does not exist, skipping.' % ( | |
211 input_filename, output_filename), | |
212 ] | |
213 expected_calls = [ | |
214 ('check_call', | |
215 ('ls', input_filename)) | |
216 ] | |
217 expected_ret_codes = [ | |
218 (1, 'File %s for %s does not exist.' % ( | |
219 input_filename, output_filename)) | |
220 ] | |
221 self.assertEquals(list(stdout_queue.queue), expected_output) | |
222 self.assertEquals(self.gsutil.history, expected_calls) | |
223 self.assertEquals(list(self.ret_codes.queue), expected_ret_codes) | |
224 | |
225 def test_download_cp_fails(self): | |
226 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f' | |
227 input_filename = '%s/%s' % (self.base_url, sha1_hash) | |
228 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt') | |
229 self.gsutil.add_expected(0, '', '') | |
230 self.gsutil.add_expected(101, '', 'Test error message.') | |
231 # pylint: disable=W0212 | |
232 code = download_from_google_storage.download_from_google_storage( | |
233 input_filename=sha1_hash, | |
234 base_url=self.base_url, | |
235 gsutil=self.gsutil, | |
236 num_threads=1, | |
237 directory=False, | |
238 recursive=False, | |
239 force=True, | |
240 output=output_filename, | |
241 ignore_errors=False, | |
242 sha1_file=False) | |
243 expected_calls = [ | |
244 ('check_call', | |
245 ('ls', input_filename)), | |
246 ('check_call', | |
247 ('cp', '-q', input_filename, output_filename)) | |
248 ] | |
249 self.assertEquals(self.gsutil.history, expected_calls) | |
250 self.assertEquals(code, 101) | |
251 | |
252 def test_download_directory_no_recursive_non_force(self): | |
253 sha1_hash = '7871c8e24da15bad8b0be2c36edc9dc77e37727f' | |
254 input_filename = '%s/%s' % (self.base_url, sha1_hash) | |
255 output_filename = os.path.join(self.base_path, 'uploaded_lorem_ipsum.txt') | |
256 code = download_from_google_storage.download_from_google_storage( | |
257 input_filename=self.base_path, | |
258 base_url=self.base_url, | |
259 gsutil=self.gsutil, | |
260 num_threads=1, | |
261 directory=True, | |
262 recursive=False, | |
263 force=False, | |
264 output=None, | |
265 ignore_errors=False, | |
266 sha1_file=False) | |
267 expected_calls = [ | |
268 ('check_call', | |
269 ('ls', input_filename)), | |
270 ('check_call', | |
271 ('cp', '-q', input_filename, output_filename))] | |
272 self.assertEquals(self.gsutil.history, expected_calls) | |
273 self.assertEquals(code, 0) | |
274 | |
M-A Ruel
2013/03/11 19:52:01
2 lines
Ryan Tseng
2013/03/11 21:34:19
Done.
| |
275 if __name__ == '__main__': | |
276 unittest.main() | |
OLD | NEW |