| Index: third_party/gsutil/gslib/addlhelp/security.py
|
| diff --git a/third_party/gsutil/gslib/addlhelp/security.py b/third_party/gsutil/gslib/addlhelp/security.py
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..da651e1a76c6f3ddd8d453560352da02017e2b49
|
| --- /dev/null
|
| +++ b/third_party/gsutil/gslib/addlhelp/security.py
|
| @@ -0,0 +1,216 @@
|
| +# -*- coding: utf-8 -*-
|
| +# Copyright 2015 Google Inc. All Rights Reserved.
|
| +#
|
| +# Licensed under the Apache License, Version 2.0 (the "License");
|
| +# you may not use this file except in compliance with the License.
|
| +# You may obtain a copy of the License at
|
| +#
|
| +# http://www.apache.org/licenses/LICENSE-2.0
|
| +#
|
| +# Unless required by applicable law or agreed to in writing, software
|
| +# distributed under the License is distributed on an "AS IS" BASIS,
|
| +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
| +# See the License for the specific language governing permissions and
|
| +# limitations under the License.
|
| +"""Additional help about types of credentials and authentication."""
|
| +
|
| +from __future__ import absolute_import
|
| +
|
| +from gslib.help_provider import HelpProvider
|
| +
|
| +_DETAILED_HELP_TEXT = ("""
|
| +<B>OVERVIEW</B>
|
| + This help section provides details about various precautions taken by gsutil
|
| + to protect data security, as well as recommendations for how customers should
|
| + safeguard security.
|
| +
|
| +
|
| +<B>TRANSPORT LAYER SECURITY</B>
|
| + gsutil performs all operations using transport-layer encryption (HTTPS), to
|
| + protect against data leakage over shared network links. This is also important
|
| + because gsutil uses "bearer tokens" for authentication (OAuth2) as well as for
|
| + resumable upload identifiers, and such tokens must be protected from being
|
| + eavesdropped and reused.
|
| +
|
| + gsutil also supports the older HMAC style of authentication via the XML API
|
| + (see "gsutil help apis"). While HMAC authentication does not use bearer
|
| + tokens (and thus is not subject to eavesdropping/replay attacks), it's still
|
| + important to encrypt data traffic.
|
| +
|
| + Prior to gsutil release 4.0 it was possible to use HTTP instead of HTTPS by
|
| + setting the "is_secure" configuration parameter in the [Boto] section of the
|
| + boto configuration file to False. However, starting with gsutil version 4.0
|
| + setting is_secure to False is disallowed. For more details about different
|
| + credential options, see "gsutil help creds".
|
| +
|
| +
|
| +<B>LOCAL FILE STORAGE SECURITY</B>
|
| + gsutil takes a number of precautions to protect against security exploits in
|
| + the files it stores locally:
|
| +
|
| + - When the gsutil config command runs it sets file protection mode 600
|
| + ("-rw-------") on the the .boto configuration file it generates, so only
|
| + the user (or superuser) can read it. This is important because these files
|
| + contain security-sensitive information, including credentials and proxy
|
| + configuration.
|
| +
|
| + - The gsutil config command also uses file protection mode 600 for the
|
| + private key file stored locally when you create service account
|
| + credentials.
|
| +
|
| + - The default level of logging output from gsutil commands does not include
|
| + security-sensitive information, such as OAuth2 tokens and proxy
|
| + configuration information. (See the "RECOMMENDED USER PRECAUTIONS" section
|
| + below if you increase the level of debug output, using the gsutil -D
|
| + option.)
|
| +
|
| + Note that protection modes are not supported on Windows, so if you
|
| + use gsutil on Windows we recommend using an encrypted file system and strong
|
| + account passwords.
|
| +
|
| +
|
| +<B>SECURITY-SENSITIVE FILES WRITTEN TEMPORARILY TO DISK BY GSUTIL</B>
|
| + gsutil buffers data in temporary files in several situations:
|
| +
|
| + - While compressing data being uploaded via gsutil cp -z, gsutil
|
| + buffers the data in temporary files with protection 600, which it
|
| + deletes after the upload is complete (similarly for downloading files
|
| + that were uploaded with gsutil cp -z or some other process that sets the
|
| + Content-Encoding to "gzip"). However, if you kill the gsutil process
|
| + while the upload is under way the partially written file will be left
|
| + in place. See the "CHANGING TEMP DIRECTORIES" section in
|
| + "gsutil help cp" for details of where the temporary files are written
|
| + and how to change the temp directory location.
|
| +
|
| + - When performing a resumable upload gsutil stores the upload ID (which,
|
| + as noted above, is a bearer token and thus should be safe-guarded) in a
|
| + file under ~/.gsutil/tracker-files with protection 600, and deletes this
|
| + file after the upload is complete. However, if the upload doesn't
|
| + complete successfully the tracker file is left in place so the resumable
|
| + upload can be re-attempted later. Over time it's possible to accumulate
|
| + these tracker files from aborted upload attempts, though resumable
|
| + upload IDs are only valid for 1 week, so the security risk only exists
|
| + for files less than that old. If you consider the risk of leaving
|
| + aborted upload IDs in the tracker directory too high you could modify
|
| + your upload scripts to delete the tracker files; or you could create a
|
| + cron job to clear the tracker directory periodically.
|
| +
|
| + - The gsutil rsync command stores temporary files (with protection 600)
|
| + containing the names, sizes, and checksums of source and destination
|
| + directories/buckets, which it deletes after the rsync is complete.
|
| + However, if you kill the gsutil process while the rsync is under way the
|
| + listing files will be left in place.
|
| +
|
| + Note that gsutil deletes temporary files using the standard OS unlink system
|
| + call, which does not perform `data wiping
|
| + <https://en.wikipedia.org/wiki/Data_erasure>`_. Thus, the content of such
|
| + temporary files can be recovered by a determined adversary.
|
| +
|
| +
|
| +<B>ACCESS CONTROL LISTS</B>
|
| + Unless you specify a different ACL (e.g., via the gsutil cp -a option), by
|
| + default objects written to a bucket use the default object ACL on that bucket.
|
| + Unless you modify that ACL (e.g., via the gsutil defacl command), by default
|
| + it will allow all project editors write access to the object and read/write
|
| + access to the object's metadata; and will allow all project viewers read
|
| + access to the object.
|
| +
|
| + The GCS access control system includes the ability to specify that objects are
|
| + publicly readable. Make sure you intend for any objects you write with this
|
| + permission to be public. Once "published", data on the Internet can be copied
|
| + to many places, so it's effectively impossible to regain read control over an
|
| + object written with this permission.
|
| +
|
| + The GCS access control system includes the ability to specify that buckets are
|
| + publicly writable. While configuring a bucket this way can be convenient for
|
| + various purposes, we recommend against using this permission - it can be
|
| + abused for distributing illegal content, viruses, and other malware, and the
|
| + bucket owner is legally and financially responsible for the content stored in
|
| + their buckets. If you need to make content available to customers who don't
|
| + have Google accounts consider instead using signed URLs (see
|
| + "gsutil help signurl").
|
| +
|
| +
|
| +<B>SOFTWARE INTEGRITY AND UPDATES</B>
|
| + gsutil is distributed as a standalone bundle via tar and zip files stored in
|
| + the gs://pub bucket, as a PyPi module, and as part of the bundled Cloud
|
| + SDK release. Each of these distribution methods takes a variety of security
|
| + precautions to protect the integrity of the software. We strongly recommend
|
| + against getting a copy of gsutil from any other sources (such as mirror
|
| + sites).
|
| +
|
| +
|
| +<B>PROXY USAGE</B>
|
| + gsutil supports access via proxies, such as Squid and a number of commercial
|
| + products. A full description of their capabilities is beyond the scope of this
|
| + documentation, but proxies can be configured to support many security-related
|
| + functions, including virus scanning, Data Leakage Prevention, control over
|
| + which certificates/CA's are trusted, content type filtering, and many more
|
| + capabilities. Some of these features can slow or block legitimate gsutil
|
| + behavior. For example, virus scanning depends on decrypting file content,
|
| + which in turn requires that the proxy terminate the gsutil connection and
|
| + establish a new connection - and in some cases proxies will rewrite content in
|
| + ways that result in checksum validation errors and other problems.
|
| +
|
| + For details on configuring proxies see the proxy help text in your .boto
|
| + configuration file (generated by the gsutil config command).
|
| +
|
| +
|
| +<B>ENCRYPTION AT REST</B>
|
| + All GCS data are stored encrypted. For more information see
|
| + `Server-Side Encryption
|
| + <https://cloud.google.com/storage/docs/concepts-techniques#encryption>`_.
|
| +
|
| +
|
| +<B>DATA PRIVACY FROM GOOGLE EMPLOYEES</B>
|
| + Google employees will never look at your data unless you first explicitly
|
| + grant them permission to do so while troubleshooting a specific incident.
|
| +
|
| + Google will never ask you to share your credentials, password, or other
|
| + security-sensitive information. Beware of potential phishing scams where
|
| + someone attempts to impersonate Google and asks for such information.
|
| +
|
| +
|
| +<B>MEASUREMENT DATA</B>
|
| + The gsutil perfdiag command collects a variety of performance-related
|
| + measurements and details about your local system and network environment, for
|
| + use in troubleshooting performance problems. None of this information will be
|
| + sent to Google unless you choose to send it.
|
| +
|
| +
|
| +<B>RECOMMENDED USER PRECAUTIONS</B>
|
| + The first and foremost precaution is: Never share your credentials. Each user
|
| + should have distinct credentials.
|
| +
|
| + If you run gsutil -D (to generate debugging output) it will include OAuth2
|
| + refresh and access tokens in the output. Make sure to redact this information
|
| + before sending this debug output to anyone during troubleshooting/tech support
|
| + interactions.
|
| +
|
| + The proxy configuration information in the .boto configuration is
|
| + security-sensitive, especially if your proxy setup requires user and
|
| + password information. Even if your proxy setup doesn't require user and
|
| + password, the host and port number for your proxy is often considered
|
| + security-sensitive. Protect access to your .boto configuration file.
|
| +
|
| + If you are using gsutil from a production environment (e.g., via a cron job
|
| + running on a host in your data center), use service account credentials rather
|
| + than individual user account credentials. These credentials were designed for
|
| + such use and, for example, protect you from losing access when an employee
|
| + leaves your company.
|
| +""")
|
| +
|
| +
|
| +class CommandOptions(HelpProvider):
|
| + """Additional help about security and privacy considerations using gsutil."""
|
| +
|
| + # Help specification. See help_provider.py for documentation.
|
| + help_spec = HelpProvider.HelpSpec(
|
| + help_name='security',
|
| + help_name_aliases=['encryption', 'protection', 'privacy', 'proxies',
|
| + 'proxy'],
|
| + help_type='additional_help',
|
| + help_one_line_summary='Security and Privacy Considerations',
|
| + help_text=_DETAILED_HELP_TEXT,
|
| + subcommand_help_text={},
|
| + )
|
|
|