| // -*- mode: c++ -*- |
| |
| // Copyright 2011 Google LLC |
| // |
| // Redistribution and use in source and binary forms, with or without |
| // modification, are permitted provided that the following conditions are |
| // met: |
| // |
| // * Redistributions of source code must retain the above copyright |
| // notice, this list of conditions and the following disclaimer. |
| // * Redistributions in binary form must reproduce the above |
| // copyright notice, this list of conditions and the following disclaimer |
| // in the documentation and/or other materials provided with the |
| // distribution. |
| // * Neither the name of Google LLC nor the names of its |
| // contributors may be used to endorse or promote products derived from |
| // this software without specific prior written permission. |
| // |
| // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| |
| // Author: Jim Blandy <[email protected]> <[email protected]> |
| |
| // dump_syms.h: Declaration of google_breakpad::DumpSymbols, a class for |
| // reading debugging information from Mach-O files and writing it out as a |
| // Breakpad symbol file. |
| |
| #include <mach-o/loader.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| |
| #include <ostream> |
| #include <string> |
| #include <vector> |
| |
| #include "common/byte_cursor.h" |
| #include "common/dwarf/dwarf2reader.h" |
| #include "common/mac/arch_utilities.h" |
| #include "common/mac/macho_reader.h" |
| #include "common/mac/super_fat_arch.h" |
| #include "common/module.h" |
| #include "common/scoped_ptr.h" |
| #include "common/symbol_data.h" |
| |
| namespace google_breakpad { |
| |
| class DumpSymbols { |
| public: |
| DumpSymbols(SymbolData symbol_data, |
| bool handle_inter_cu_refs, |
| bool enable_multiple = false, |
| const std::string& module_name = "", |
| bool prefer_extern_name = false) |
| : symbol_data_(symbol_data), |
| handle_inter_cu_refs_(handle_inter_cu_refs), |
| object_filename_(), |
| contents_(), |
| size_(0), |
| from_disk_(false), |
| object_files_(), |
| selected_object_file_(), |
| selected_object_name_(), |
| enable_multiple_(enable_multiple), |
| module_name_(module_name), |
| prefer_extern_name_(prefer_extern_name) {} |
| ~DumpSymbols() = default; |
| |
| // Prepare to read debugging information from |filename|. |filename| may be |
| // the name of a fat file, a Mach-O file, or a dSYM bundle containing either |
| // of the above. |
| // |
| // If |module_name_| is empty, uses the basename of |filename| as the module |
| // name. Otherwise, uses |module_name_| as the module name. |
| // |
| // On success, return true; if there is a problem reading |
| // |filename|, report it and return false. |
| bool Read(const std::string& filename); |
| |
| // Prepare to read debugging information from |contents|. |contents| is |
| // expected to be the data obtained from reading a fat file, or a Mach-O file. |
| // |filename| is used to determine the object filename in the generated |
| // output; there will not be an attempt to open this file as the data |
| // is already expected to be in memory. On success, return true; if there is a |
| // problem reading |contents|, report it and return false. |
| bool ReadData(uint8_t* contents, size_t size, const std::string& filename); |
| |
| // If this dumper's file includes an object file for `info`, then select that |
| // object file for dumping, and return true. Otherwise, return false, and |
| // leave this dumper's selected architecture unchanged. |
| // |
| // By default, if this dumper's file contains only one object file, then |
| // the dumper will dump those symbols; and if it contains more than one |
| // object file, then the dumper will dump the object file whose |
| // architecture matches that of this dumper program. |
| bool SetArchitecture(const ArchInfo& info); |
| |
| // Return a pointer to an array of SuperFatArch structures describing the |
| // object files contained in this dumper's file. Set *|count| to the number |
| // of elements in the array. The returned array is owned by this DumpSymbols |
| // instance. |
| // |
| // If there are no available architectures, this function |
| // may return NULL. |
| const SuperFatArch* AvailableArchitectures(size_t* count) { |
| *count = object_files_.size(); |
| if (object_files_.size() > 0) |
| return &object_files_[0]; |
| return NULL; |
| } |
| |
| // Read the selected object file's debugging information, and write out the |
| // header only to |stream|. Return true on success; if an error occurs, report |
| // it and return false. |
| bool WriteSymbolFileHeader(std::ostream& stream); |
| |
| // Read the selected object file's debugging information and store it in |
| // `module`. The caller owns the resulting module object and must delete |
| // it when finished. |
| bool ReadSymbolData(Module** module); |
| |
| // Return an identifier string for the file this DumpSymbols is dumping. |
| std::string Identifier(); |
| |
| private: |
| // Used internally. |
| class DumperLineToModule; |
| class DumperRangesHandler; |
| class LoadCommandDumper; |
| |
| // This method behaves similarly to NXFindBestFatArch, but it supports |
| // SuperFatArch. |
| SuperFatArch* FindBestMatchForArchitecture( |
| cpu_type_t cpu_type, cpu_subtype_t cpu_subtype); |
| |
| // Creates an empty module object. |
| bool CreateEmptyModule(scoped_ptr<Module>& module); |
| |
| // Process the split dwarf file referenced by reader. |
| void StartProcessSplitDwarf(google_breakpad::CompilationUnit* reader, |
| Module* module, |
| google_breakpad::Endianness endianness, |
| bool handle_inter_cu_refs, |
| bool handle_inline) const; |
| |
| // Read debugging information from |dwarf_sections|, which was taken from |
| // |macho_reader|, and add it to |module|. |
| void ReadDwarf(google_breakpad::Module* module, |
| const mach_o::Reader& macho_reader, |
| const mach_o::SectionMap& dwarf_sections, |
| bool handle_inter_cu_refs) const; |
| |
| // Read DWARF CFI or .eh_frame data from |section|, belonging to |
| // |macho_reader|, and record it in |module|. If |eh_frame| is true, |
| // then the data is .eh_frame-format data; otherwise, it is standard DWARF |
| // .debug_frame data. On success, return true; on failure, report |
| // the problem and return false. |
| bool ReadCFI(google_breakpad::Module* module, |
| const mach_o::Reader& macho_reader, |
| const mach_o::Section& section, |
| bool eh_frame) const; |
| |
| // The selection of what type of symbol data to read/write. |
| const SymbolData symbol_data_; |
| |
| // Whether to handle references between compilation units. |
| const bool handle_inter_cu_refs_; |
| |
| // The name of the file this DumpSymbols will actually read debugging |
| // information from. If the filename passed to Read refers to a dSYM bundle, |
| // then this is the resource file within that bundle. |
| std::string object_filename_; |
| |
| // The complete contents of object_filename_, mapped into memory. |
| scoped_array<uint8_t> contents_; |
| |
| // The size of contents_. |
| size_t size_; |
| |
| // Indicates which entry point to DumpSymbols was used, i.e. Read vs ReadData. |
| // This is used to indicate that downstream code paths can/should also read |
| // from disk or not. |
| bool from_disk_; |
| |
| // A vector of SuperFatArch structures describing the object files |
| // object_filename_ contains. If object_filename_ refers to a fat binary, |
| // this may have more than one element; if it refers to a Mach-O file, this |
| // has exactly one element. |
| vector<SuperFatArch> object_files_; |
| |
| // The object file in object_files_ selected to dump, or NULL if |
| // SetArchitecture hasn't been called yet. |
| const SuperFatArch* selected_object_file_; |
| |
| // A string that identifies the selected object file, for use in error |
| // messages. This is usually object_filename_, but if that refers to a |
| // fat binary, it includes an indication of the particular architecture |
| // within that binary. |
| string selected_object_name_; |
| |
| // Whether symbols sharing an address should be collapsed into a single entry |
| // and marked with an `m` in the output. |
| // See: https://crbug.com/google-breakpad/751 and docs at |
| // docs/symbol_files.md#records-3 |
| bool enable_multiple_; |
| |
| // If non-empty, used as the module name. Otherwise, the basename of |
| // |object_filename_| is used as the module name. |
| const std::string module_name_; |
| |
| // If a Function and an Extern share the same address but have a different |
| // name, prefer the name of the Extern. |
| // |
| // Use this when dumping Mach-O .dSYMs built with -gmlt (Minimum Line Tables), |
| // as the Function's fully-qualified name will only be present in the STABS |
| // (which are placed in the Extern), not in the DWARF symbols (which are |
| // placed in the Function). |
| bool prefer_extern_name_; |
| }; |
| |
| } // namespace google_breakpad |