OLD | NEW |
| (Empty) |
1 # Copyright 2011 Google Inc. All Rights Reserved. | |
2 # | |
3 # Licensed under the Apache License, Version 2.0 (the "License"); | |
4 # you may not use this file except in compliance with the License. | |
5 # You may obtain a copy of the License at | |
6 # | |
7 # http://www.apache.org/licenses/LICENSE-2.0 | |
8 # | |
9 # Unless required by applicable law or agreed to in writing, software | |
10 # distributed under the License is distributed on an "AS IS" BASIS, | |
11 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
12 # See the License for the specific language governing permissions and | |
13 # limitations under the License. | |
14 | |
15 import boto | |
16 | |
17 from boto.exception import GSResponseError | |
18 from gslib.command import Command | |
19 from gslib.command import COMMAND_NAME | |
20 from gslib.command import COMMAND_NAME_ALIASES | |
21 from gslib.command import CONFIG_REQUIRED | |
22 from gslib.command import FILE_URIS_OK | |
23 from gslib.command import MAX_ARGS | |
24 from gslib.command import MIN_ARGS | |
25 from gslib.command import PROVIDER_URIS_OK | |
26 from gslib.command import SUPPORTED_SUB_ARGS | |
27 from gslib.command import URIS_START_ARG | |
28 from gslib.exception import CommandException | |
29 from gslib.help_provider import HELP_NAME | |
30 from gslib.help_provider import HELP_NAME_ALIASES | |
31 from gslib.help_provider import HELP_ONE_LINE_SUMMARY | |
32 from gslib.help_provider import HELP_TEXT | |
33 from gslib.help_provider import HelpType | |
34 from gslib.help_provider import HELP_TYPE | |
35 from gslib.name_expansion import NameExpansionIterator | |
36 from gslib.util import NO_MAX | |
37 | |
# User-facing help for "gsutil help rm"; wired into RmCommand.help_spec via
# HELP_TEXT. The <B>...</B> markers delimit section headings.
_detailed_help_text = ("""
<B>SYNOPSIS</B>
  gsutil rm [-f] [-R] [-a] uri...


<B>DESCRIPTION</B>
  The gsutil rm command removes objects.
  For example, the command:

    gsutil rm gs://bucket/subdir/*

  will remove all objects in gs://bucket/subdir, but not in any of its
  sub-directories. In contrast:

    gsutil rm gs://bucket/subdir/**

  will remove all objects under gs://bucket/subdir or any of its
  subdirectories.

  You can also use the -R option to specify recursive object deletion. Thus, for
  example, the following two commands will both remove all objects in a bucket:

    gsutil rm gs://bucket/**
    gsutil rm -R gs://bucket

  If you have a large number of objects to remove you might want to use the
  gsutil -m option, to perform parallel (multi-threaded/multi-processing)
  removes:

    gsutil -m rm -R gs://my_bucket/subdir

  Note that gsutil rm will refuse to remove files from the local
  file system. For example this will fail:

    gsutil rm *.txt


<B>OPTIONS</B>
  -f          Continues silently (without printing error messages) despite
              errors when removing multiple objects.

  -R, -r      Causes bucket contents to be removed recursively (i.e., including
              all objects and subdirectories). Will not delete the bucket
              itself; you need to run the gsutil rb command separately to do
              that.

  -a          Delete all versions of an object.
""")
86 | |
87 | |
class RmCommand(Command):
  """Implementation of gsutil rm command.

  Expands the URI arguments (wildcards, and bucket contents when -r/-R is
  given) and deletes each resulting object through self.Apply(). Buckets
  themselves are never removed; a URI that names a container is rejected with
  a CommandException.
  """

  # Command specification (processed by parent class).
  command_spec = {
    # Name of command.
    COMMAND_NAME : 'rm',
    # List of command name aliases.
    COMMAND_NAME_ALIASES : ['del', 'delete', 'remove'],
    # Min number of args required by this command.
    MIN_ARGS : 1,
    # Max number of args required by this command, or NO_MAX.
    MAX_ARGS : NO_MAX,
    # Getopt-style string specifying acceptable sub args.
    SUPPORTED_SUB_ARGS : 'afrRv',
    # True if file URIs acceptable for this command.
    FILE_URIS_OK : False,
    # True if provider-only URIs acceptable for this command.
    PROVIDER_URIS_OK : False,
    # Index in args of first URI arg.
    URIS_START_ARG : 0,
    # True if must configure gsutil before running command.
    CONFIG_REQUIRED : True,
  }
  help_spec = {
    # Name of command or auxiliary help info for which this help applies.
    HELP_NAME : 'rm',
    # List of help name aliases.
    HELP_NAME_ALIASES : ['del', 'delete', 'remove'],
    # Type of help:
    HELP_TYPE : HelpType.COMMAND_HELP,
    # One line summary of this help.
    HELP_ONE_LINE_SUMMARY : 'Remove objects',
    # The full help text.
    HELP_TEXT : _detailed_help_text,
  }

  # Command entry point.
  def RunCommand(self):
    """Parses the sub-options and removes every object matched by self.args.

    Returns:
      0 on completion.

    Raises:
      CommandException: if name expansion or a removal fails and -f was not
          given, or if any removal was recorded as failed and -f was not
          given.
      GSResponseError: propagated from the removal pass when -f was not given.
    """
    # self.recursion_requested initialized in command.py (so can be checked
    # in parent class for all commands).
    self.continue_on_error = False
    self.all_versions = False
    if self.sub_opts:
      for o, unused_a in self.sub_opts:
        if o == '-a':
          self.all_versions = True
        elif o == '-f':
          self.continue_on_error = True
        elif o == '-r' or o == '-R':
          self.recursion_requested = True
        elif o == '-v':
          self.THREADED_LOGGER.info('WARNING: The %s -v option is no longer'
                                    ' needed, and will eventually be removed.\n'
                                    % self.command_name)

    # Used to track if any files failed to be removed.
    self.everything_removed_okay = True

    remove_func = self._MkRemoveFunc()
    exception_handler = self._MkRemoveExceptionHandler()

    try:
      # Expand wildcards, dirs, buckets, and bucket subdirs in URIs.
      name_expansion_iterator = NameExpansionIterator(
          self.command_name, self.proj_id_handler, self.headers, self.debug,
          self.bucket_storage_uri_class, self.args, self.recursion_requested,
          flat=self.recursion_requested, all_versions=self.all_versions)

      # Perform remove requests in parallel (-m) mode, if requested, using
      # configured number of parallel processes and threads. Otherwise,
      # perform requests with sequential function calls in current process.
      self.Apply(remove_func, name_expansion_iterator, exception_handler)

    # Assuming the bucket has versioning enabled, uri's that don't map to
    # objects should throw an error even with all_versions, since the prior
    # round of deletes only sends objects to a history table.
    # This assumption that rm -a is only called for versioned buckets should be
    # corrected, but the fix is non-trivial.
    except (CommandException, GSResponseError):
      # With -f both error types are deliberately swallowed so the command
      # can carry on; without it they propagate to the caller.
      if not self.continue_on_error:
        raise

    if not self.everything_removed_okay and not self.continue_on_error:
      raise CommandException('Some files could not be removed.')

    # If this was a gsutil rm -r command covering any bucket subdirs,
    # remove any dir_$folder$ objects (which are created by various web UI
    # tools to simulate folders).
    if self.recursion_requested:
      folder_object_wildcards = []
      for uri_str in self.args:
        uri = self.suri_builder.StorageUri(uri_str)
        # names_object is invoked like names_container() and is_cloud_uri()
        # elsewhere in this class; testing the bare attribute would be truthy
        # for every URI.
        # NOTE(review): assumes names_object is a method -- confirm against
        # the StorageUri class in use.
        if uri.names_object():
          folder_object_wildcards.append('%s**_$folder$' % uri)
      if folder_object_wildcards:
        # Folder placeholder cleanup is best-effort, so individual delete
        # failures from here on are recorded rather than raised.
        self.continue_on_error = True
        try:
          name_expansion_iterator = NameExpansionIterator(
              self.command_name, self.proj_id_handler, self.headers, self.debug,
              self.bucket_storage_uri_class, folder_object_wildcards,
              self.recursion_requested, flat=True,
              all_versions=self.all_versions)
          self.Apply(remove_func, name_expansion_iterator, exception_handler)
        except CommandException as e:
          # Ignore exception from name expansion due to an absent folder file.
          if not e.reason.startswith('No URIs matched:'):
            raise

    return 0

  def _MkRemoveExceptionHandler(self):
    """Returns the exception callback handed to self.Apply().

    The callback logs the exception and clears self.everything_removed_okay
    so RunCommand can report the failure once Apply() has finished.
    """
    def RemoveExceptionHandler(e):
      """Simple exception handler to allow post-completion status."""
      self.THREADED_LOGGER.error(str(e))
      self.everything_removed_okay = False
    return RemoveExceptionHandler

  def _MkRemoveFunc(self):
    """Returns the per-result worker function handed to self.Apply().

    The worker takes one name expansion result, refuses URIs that name a
    container (raising CommandException), and otherwise deletes the key.
    """
    def RemoveFunc(name_expansion_result):
      """Deletes the single object named by name_expansion_result."""
      exp_src_uri = self.suri_builder.StorageUri(
          name_expansion_result.GetExpandedUriStr(),
          is_latest=name_expansion_result.is_latest)
      if exp_src_uri.names_container():
        if exp_src_uri.is_cloud_uri():
          # Before offering advice about how to do rm + rb, ensure those
          # commands won't fail because of bucket naming problems.
          boto.s3.connection.check_lowercase_bucketname(
              exp_src_uri.bucket_name)
        # NOTE(review): for a container URI object_name may be empty, which
        # would leave the bucket out of the suggested commands -- confirm.
        uri_str = exp_src_uri.object_name.rstrip('/')
        raise CommandException('"rm" command will not remove buckets. To '
                               'delete this/these bucket(s) do:\n\tgsutil rm '
                               '%s/*\n\tgsutil rb %s' % (uri_str, uri_str))

      # Perform delete.
      self.THREADED_LOGGER.info('Removing %s...',
                                name_expansion_result.expanded_uri_str)
      try:
        exp_src_uri.delete_key(validate=False, headers=self.headers)
      except Exception:
        # Catch Exception rather than everything so that KeyboardInterrupt
        # and SystemExit still stop the command even when -f is in effect.
        if not self.continue_on_error:
          raise
        self.everything_removed_okay = False
    return RemoveFunc
OLD | NEW |