Index: util/mac/mach_o_image_reader.h |
diff --git a/util/mac/mach_o_image_reader.h b/util/mac/mach_o_image_reader.h |
new file mode 100644 |
index 0000000000000000000000000000000000000000..eb2435486361172dc7def5e4aa240768e724bda3 |
--- /dev/null |
+++ b/util/mac/mach_o_image_reader.h |
@@ -0,0 +1,279 @@ |
+// Copyright 2014 The Crashpad Authors. All rights reserved. |
+// |
+// Licensed under the Apache License, Version 2.0 (the "License"); |
+// you may not use this file except in compliance with the License. |
+// You may obtain a copy of the License at |
+// |
+// http://www.apache.org/licenses/LICENSE-2.0 |
+// |
+// Unless required by applicable law or agreed to in writing, software |
+// distributed under the License is distributed on an "AS IS" BASIS, |
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
+// See the License for the specific language governing permissions and |
+// limitations under the License. |
+ |
+#ifndef CRASHPAD_UTIL_MAC_MACH_O_IMAGE_READER_H_ |
+#define CRASHPAD_UTIL_MAC_MACH_O_IMAGE_READER_H_ |
+ |
+#include <mach/mach.h> |
+#include <stdint.h> |
+ |
+#include <map> |
+#include <string> |
+ |
+#include "base/basictypes.h" |
+#include "base/memory/scoped_ptr.h" |
+#include "util/misc/initialization_state_dcheck.h" |
+#include "util/misc/uuid.h" |
+#include "util/stdlib/pointer_container.h" |
+#include "util/mac/process_types.h" |
+ |
+namespace crashpad { |
+ |
+class MachOImageSegmentReader; |
+class ProcessReader; |
+ |
+//! \brief A reader for Mach-O images mapped into another process. |
+//! |
+//! This class is capable of reading both 32-bit (`mach_header`/`MH_MAGIC`) and |
+//! 64-bit (`mach_header_64`/`MH_MAGIC_64`) images based on the bitness of the |
+//! remote process. |
+class MachOImageReader { |
+ public: |
+ MachOImageReader(); |
+ ~MachOImageReader(); |
+ |
+ //! \brief Reads the Mach-O image file’s load commands from another process. |
+ //! |
+ //! This method must only be called once on an object. This method must be |
+ //! called successfully before any other method in this class may be called. |
+ //! |
+ //! \param[in] process_reader The reader for the remote process. |
+ //! \param[in] address The address, in the remote process’ address space, |
+ //! where the `mach_header` or `mach_header_64` at the beginning of the |
+ //! image to be read is located. This address can be determined by reading |
+ //! the remote process’ dyld information (see |
+ //! util/mac/process_types/dyld_images.proctype). |
+ //! \param[in] name The module’s name, a string to be used in logged messages. |
+ //! This string is for diagnostic purposes only, and may be empty. |
+ //! |
+ //! \return `true` if the image was read successfully, including all load |
+ //! commands. `false` otherwise, with an appropriate message logged. |
+ bool Initialize(ProcessReader* process_reader, |
+ mach_vm_address_t address, |
+ const std::string& name); |
+ |
+ //! \brief Returns the Mach-O file type. |
+ //! |
+ //! This value comes from the `filetype` field of the `mach_header` or |
+ //! `mach_header_64`. Common values include `MH_EXECUTE`, `MH_DYLIB`, |
+ //! `MH_DYLINKER`, and `MH_BUNDLE`. |
+ uint32_t FileType() const { return file_type_; } |
+ |
+ //! \brief Returns the Mach-O image’s load address. |
+ //! |
+ //! This is the value passed as \a address to Initialize(). |
+ mach_vm_address_t Address() const { return address_; } |
+ |
+ //! \brief Returns the mapped size of the Mach-O image’s __TEXT segment. |
+ //! |
+ //! Note that this is returns only the size of the __TEXT segment, not of any |
+ //! other segment. This is because the interface only allows one load address |
+ //! and size to be reported, but Mach-O image files may consist of multiple |
+ //! discontiguous segments. By convention, the __TEXT segment is always mapped |
+ //! at the beginning of a Mach-O image file, and it is the most useful for the |
+ //! expected intended purpose of collecting data to obtain stack backtraces. |
+ //! The implementation insists during initialization that the __TEXT segment |
+ //! be mapped at the beginning of the file. |
+ //! |
+ //! In practice, discontiguous segments are only found for images that have |
+ //! loaded out of the dyld shared cache, but the __TEXT segment’s size is |
+ //! returned for modules that loaded with contiguous segments as well for |
+ //! consistency. |
+ mach_vm_size_t Size() const { return size_; } |
+ |
+ //! \brief Returns the Mach-O image’s “slide,” the difference between its |
+ //! actual load address and its preferred load address. |
+ //! |
+ //! “Slide” is computed by subtracting the __TEXT segment’s preferred load |
+ //! address from its actual load address. It will be reported as a positive |
+ //! offset when the actual load address is greater than the preferred load |
+ //! address. The preferred load address is taken to be the segment’s reported |
+ //! `vmaddr` value. |
+ mach_vm_size_t Slide() const { return slide_; } |
+ |
+ //! \brief Obtain segment information by segment name. |
+ //! |
+ //! \param[in] segment_name The name of the segment to search for, for |
+ //! example, `"__TEXT"`. |
+ //! \param[out] address The actual address that the segment was loaded at in |
+ //! memory, taking any “slide” into account if the segment did not load at |
+ //! its preferred address as stored in the Mach-O image file. This |
+ //! parameter can be `NULL`. |
+ //! \param[out] size The actual size of the segment as loaded at in memory. |
+ //! This value takes any expansion of the segment into account, which |
+ //! occurs when a nonsliding segment in a sliding image loads at its |
+ //! preferred address but grows by the value of the slide. This parameter |
+ //! can be `NULL`. |
+ //! |
+ //! \return A pointer to the segment information if it was found, or `NULL` if |
+ //! it was not found. |
+ //! |
+ //! \note The \a address parameter takes “slide” into account, and the \a size |
+ //! parameter takes growth into account for non-sliding segments, so that |
+ //! these parameters reflect the actual address and size of the segment as |
+ //! loaded into a process’ address space. This is distinct from the |
+ //! segment’s preferred load address and size, which may be obtained by |
+ //! calling MachOImageSegmentReader::vmaddr() and |
+ //! MachOImageSegmentReader::vmsize(), respectively. |
+ const MachOImageSegmentReader* GetSegmentByName( |
+ const std::string& segment_name, |
+ mach_vm_address_t* address, |
+ mach_vm_size_t* size) const; |
+ |
+ //! \brief Obtain section information by segment and section name. |
+ //! |
+ //! \param[in] segment_name The name of the segment to search for, for |
+ //! example, `"__TEXT"`. |
+ //! \param[in] section_name The name of the section within the segment to |
+ //! search for, for example, `"__text"`. |
+ //! \param[out] address The actual address that the section was loaded at in |
+ //! memory, taking any “slide” into account if the section did not load at |
+ //! its preferred address as stored in the Mach-O image file. This |
+ //! parameter can be `NULL`. |
+ //! |
+ //! \return A pointer to the section information if it was found, or `NULL` if |
+ //! it was not found. |
+ //! |
+ //! No parameter is provided for the section’s size, because it can be |
+ //! obtained from the returned process_types::section::size field. |
+ //! |
+ //! \note The process_types::section::addr field gives the section’s preferred |
+ //! load address as stored in the Mach-O image file, and is not adjusted |
+ //! for any “slide” that may have occurred when the image was loaded. Use |
+ //! \a address to obtain the section’s actual load address. |
+ const process_types::section* GetSectionByName( |
+ const std::string& segment_name, |
+ const std::string& section_name, |
+ mach_vm_address_t* address) const; |
+ |
+ //! \brief Obtain section information by section index. |
+ //! |
+ //! \param[in] index The index of the section to return, in the order that it |
+ //! appears in the segment load commands. This is a 1-based index, |
+ //! matching the section number values used for `nlist::n_sect`. |
+ //! \param[out] address The actual address that the section was loaded at in |
+ //! memory, taking any “slide” into account if the section did not load at |
+ //! its preferred address as stored in the Mach-O image file. This |
+ //! parameter can be `NULL`. |
+ //! |
+ //! \return A pointer to the section information. If \a index is out of range, |
+ //! logs a warning and returns `NULL`. |
+ //! |
+ //! No parameter is provided for the section’s size, because it can be |
+ //! obtained from the returned process_types::section::size field. |
+ //! |
+ //! \note The process_types::section::addr field gives the section’s preferred |
+ //! load address as stored in the Mach-O image file, and is not adjusted |
+ //! for any “slide” that may have occurred when the image was loaded. Use |
+ //! \a address to obtain the section’s actual load address. |
+ //! \note Unlike MachOImageSegmentReader::GetSectionAtIndex(), this method |
+ //! accepts out-of-range values for \a index, and returns `NULL` instead |
+ //! of aborting execution upon encountering an out-of-range value. This is |
+ //! because a Mach-O image file’s symbol table refers to this per-module |
+ //! section index, and an out-of-range index in that case should be |
+ //! treated as a data error (where the data is beyond this code’s control) |
+ //! and handled non-fatally by reporting the error to the caller. |
+ const process_types::section* GetSectionAtIndex( |
+ size_t index, |
+ mach_vm_address_t* address) const; |
+ |
+ //! \brief Returns a Mach-O dylib image’s current version. |
+ //! |
+ //! This information comes from the `dylib_current_version` field of a dylib’s |
+ //! `LC_ID_DYLIB` load command. For dylibs without this load command, `0` will |
+ //! be returned. |
+ //! |
+ //! This method may only be called on Mach-O images for which FileType() |
+ //! returns `MH_DYLIB`. |
+ uint32_t DylibVersion() const; |
+ |
+ //! \brief Returns a Mach-O image’s source version. |
+ //! |
+ //! This information comes from a Mach-O image’s `LC_SOURCE_VERSION` load |
+ //! command. For Mach-O images without this load command, `0` will be |
+ //! returned. |
+ uint64_t SourceVersion() const { return source_version_; } |
+ |
+ //! \brief Returns a Mach-O image’s UUID. |
+ //! |
+ //! This information comes from a Mach-O image’s `LC_UUID` load command. For |
+ //! Mach-O images without this load command, a zeroed-out UUID value will be |
+ //! returned. |
+ // |
+ // UUID is a name in this scope (referring to this method), so the parameter’s |
+ // type needs to be qualified with |crashpad::|. |
+ void UUID(crashpad::UUID* uuid) const; |
+ |
+ //! \brief Returns the dynamic linker’s pathname. |
+ //! |
+ //! The dynamic linker is normally /usr/lib/dyld. |
+ //! |
+ //! For executable images (those with file type `MH_EXECUTE`), this is the |
+ //! name provided in the `LC_LOAD_DYLINKER` load command, if any. For dynamic |
+ //! linker images (those with file type `MH_DYLINKER`), this is the name |
+ //! provided in the `LC_ID_DYLINKER` load command. In other cases, this will |
+ //! be empty. |
+ std::string DylinkerName() const { return dylinker_name_; } |
+ |
+ private: |
+ // A generic helper routine for the other Read*Command() methods. |
+ template <typename T> |
+ bool ReadLoadCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info, |
+ uint32_t expected_load_command_id, |
+ T* load_command); |
+ |
+ // The Read*Command() methods are subroutines called by Initialize(). They are |
+ // responsible for reading a single load command. They may update the member |
+ // fields of their MachOImageReader object. If they can’t make sense of a load |
+ // command, they return false. |
+ bool ReadSegmentCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ bool ReadSymTabCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ bool ReadDySymTabCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ bool ReadIdDylibCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ bool ReadDylinkerCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ bool ReadUUIDCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ bool ReadSourceVersionCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ bool ReadUnexpectedCommand(mach_vm_address_t load_command_address, |
+ const std::string& load_command_info); |
+ |
+ PointerVector<MachOImageSegmentReader> segments_; |
+ std::map<std::string, size_t> segment_map_; |
+ std::string module_info_; |
+ std::string dylinker_name_; |
+ crashpad::UUID uuid_; |
+ mach_vm_address_t address_; |
+ mach_vm_size_t size_; |
+ mach_vm_size_t slide_; |
+ uint64_t source_version_; |
+ scoped_ptr<process_types::symtab_command> symtab_command_; |
+ scoped_ptr<process_types::dysymtab_command> dysymtab_command_; |
+ scoped_ptr<process_types::dylib_command> id_dylib_command_; |
+ ProcessReader* process_reader_; // weak |
+ uint32_t file_type_; |
+ InitializationStateDcheck initialized_; |
+ |
+ DISALLOW_COPY_AND_ASSIGN(MachOImageReader); |
+}; |
+ |
+} // namespace crashpad |
+ |
+#endif // CRASHPAD_UTIL_MAC_MACH_O_IMAGE_READER_H_ |