| // -*- mode: C++ -*- |
| |
| // Copyright (c) 2010, Google Inc. |
| // All rights reserved. |
| // |
| // Redistribution and use in source and binary forms, with or without |
| // modification, are permitted provided that the following conditions are |
| // met: |
| // |
| // * Redistributions of source code must retain the above copyright |
| // notice, this list of conditions and the following disclaimer. |
| // * Redistributions in binary form must reproduce the above |
| // copyright notice, this list of conditions and the following disclaimer |
| // in the documentation and/or other materials provided with the |
| // distribution. |
| // * Neither the name of Google Inc. nor the names of its |
| // contributors may be used to endorse or promote products derived from |
| // this software without specific prior written permission. |
| // |
| // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| |
| // Original author: Jim Blandy <jimb@mozilla.com> <jimb@red-bean.com> |
| |
| // cfi_assembler.h: Define CFISection, a class for creating properly |
| // (and improperly) formatted DWARF CFI data for unit tests. |
| |
| #ifndef PROCESSOR_CFI_ASSEMBLER_H_ |
| #define PROCESSOR_CFI_ASSEMBLER_H_ |
| |
| #include <string> |
| |
| #include "common/dwarf/dwarf2enums.h" |
| #include "common/test_assembler.h" |
| #include "common/using_std_string.h" |
| #include "google_breakpad/common/breakpad_types.h" |
| |
| namespace google_breakpad { |
| |
| using dwarf2reader::DwarfPointerEncoding; |
| using google_breakpad::test_assembler::Endianness; |
| using google_breakpad::test_assembler::Label; |
| using google_breakpad::test_assembler::Section; |
| |
| class CFISection: public Section { |
| public: |
| |
| // CFI augmentation strings beginning with 'z', defined by the |
| // Linux/IA-64 C++ ABI, can specify interesting encodings for |
| // addresses appearing in FDE headers and call frame instructions (and |
| // for additional fields whose presence the augmentation string |
| // specifies). In particular, pointers can be specified to be relative |
| // to various base address: the start of the .text section, the |
| // location holding the address itself, and so on. These allow the |
| // frame data to be position-independent even when they live in |
| // write-protected pages. These variants are specified at the |
| // following two URLs: |
| // |
| // http://refspecs.linux-foundation.org/LSB_4.0.0/LSB-Core-generic/LSB-Core-generic/dwarfext.html |
| // http://refspecs.linux-foundation.org/LSB_4.0.0/LSB-Core-generic/LSB-Core-generic/ehframechpt.html |
| // |
| // CFISection leaves the production of well-formed 'z'-augmented CIEs and |
| // FDEs to the user, but does provide EncodedPointer, to emit |
| // properly-encoded addresses for a given pointer encoding. |
| // EncodedPointer uses an instance of this structure to find the base |
| // addresses it should use; you can establish a default for all encoded |
| // pointers appended to this section with SetEncodedPointerBases. |
| struct EncodedPointerBases { |
| EncodedPointerBases() : cfi(), text(), data() { } |
| |
| // The starting address of this CFI section in memory, for |
| // DW_EH_PE_pcrel. DW_EH_PE_pcrel pointers may only be used in data |
| // that has is loaded into the program's address space. |
| uint64_t cfi; |
| |
| // The starting address of this file's .text section, for DW_EH_PE_textrel. |
| uint64_t text; |
| |
| // The starting address of this file's .got or .eh_frame_hdr section, |
| // for DW_EH_PE_datarel. |
| uint64_t data; |
| }; |
| |
| // Create a CFISection whose endianness is ENDIANNESS, and where |
| // machine addresses are ADDRESS_SIZE bytes long. If EH_FRAME is |
| // true, use the .eh_frame format, as described by the Linux |
| // Standards Base Core Specification, instead of the DWARF CFI |
| // format. |
| CFISection(Endianness endianness, size_t address_size, |
| bool eh_frame = false) |
| : Section(endianness), address_size_(address_size), eh_frame_(eh_frame), |
| pointer_encoding_(dwarf2reader::DW_EH_PE_absptr), |
| encoded_pointer_bases_(), entry_length_(NULL), in_fde_(false) { |
| // The 'start', 'Here', and 'Mark' members of a CFISection all refer |
| // to section offsets. |
| start() = 0; |
| } |
| |
| // Return this CFISection's address size. |
| size_t AddressSize() const { return address_size_; } |
| |
| // Return true if this CFISection uses the .eh_frame format, or |
| // false if it contains ordinary DWARF CFI data. |
| bool ContainsEHFrame() const { return eh_frame_; } |
| |
| // Use ENCODING for pointers in calls to FDEHeader and EncodedPointer. |
| void SetPointerEncoding(DwarfPointerEncoding encoding) { |
| pointer_encoding_ = encoding; |
| } |
| |
| // Use the addresses in BASES as the base addresses for encoded |
| // pointers in subsequent calls to FDEHeader or EncodedPointer. |
| // This function makes a copy of BASES. |
| void SetEncodedPointerBases(const EncodedPointerBases& bases) { |
| encoded_pointer_bases_ = bases; |
| } |
| |
| // Append a Common Information Entry header to this section with the |
| // given values. If dwarf64 is true, use the 64-bit DWARF initial |
| // length format for the CIE's initial length. Return a reference to |
| // this section. You should call FinishEntry after writing the last |
| // instruction for the CIE. |
| // |
| // Before calling this function, you will typically want to use Mark |
| // or Here to make a label to pass to FDEHeader that refers to this |
| // CIE's position in the section. |
| CFISection& CIEHeader(uint64_t code_alignment_factor, |
| int data_alignment_factor, |
| unsigned return_address_register, |
| uint8_t version = 3, |
| const string& augmentation = "", |
| bool dwarf64 = false, |
| uint8_t address_size = 8, |
| uint8_t segment_size = 0); |
| |
| // Append a Frame Description Entry header to this section with the |
| // given values. If dwarf64 is true, use the 64-bit DWARF initial |
| // length format for the CIE's initial length. Return a reference to |
| // this section. You should call FinishEntry after writing the last |
| // instruction for the CIE. |
| // |
| // This function doesn't support entries that are longer than |
| // 0xffffff00 bytes. (The "initial length" is always a 32-bit |
| // value.) Nor does it support .debug_frame sections longer than |
| // 0xffffff00 bytes. |
| CFISection& FDEHeader(Label cie_pointer, |
| uint64_t initial_location, |
| uint64_t address_range, |
| bool dwarf64 = false); |
| |
| // Note the current position as the end of the last CIE or FDE we |
| // started, after padding with DW_CFA_nops for alignment. This |
| // defines the label representing the entry's length, cited in the |
| // entry's header. Return a reference to this section. |
| CFISection& FinishEntry(); |
| |
| // Append the contents of BLOCK as a DW_FORM_block value: an |
| // unsigned LEB128 length, followed by that many bytes of data. |
| CFISection& Block(const string& block) { |
| ULEB128(block.size()); |
| Append(block); |
| return *this; |
| } |
| |
| // Append ADDRESS to this section, in the appropriate size and |
| // endianness. Return a reference to this section. |
| CFISection& Address(uint64_t address) { |
| Section::Append(endianness(), address_size_, address); |
| return *this; |
| } |
| CFISection& Address(Label address) { |
| Section::Append(endianness(), address_size_, address); |
| return *this; |
| } |
| |
| // Append ADDRESS to this section, using ENCODING and BASES. ENCODING |
| // defaults to this section's default encoding, established by |
| // SetPointerEncoding. BASES defaults to this section's bases, set by |
| // SetEncodedPointerBases. If the DW_EH_PE_indirect bit is set in the |
| // encoding, assume that ADDRESS is where the true address is stored. |
| // Return a reference to this section. |
| // |
| // (C++ doesn't let me use default arguments here, because I want to |
| // refer to members of *this in the default argument expression.) |
| CFISection& EncodedPointer(uint64_t address) { |
| return EncodedPointer(address, pointer_encoding_, encoded_pointer_bases_); |
| } |
| CFISection& EncodedPointer(uint64_t address, DwarfPointerEncoding encoding) { |
| return EncodedPointer(address, encoding, encoded_pointer_bases_); |
| } |
| CFISection& EncodedPointer(uint64_t address, DwarfPointerEncoding encoding, |
| const EncodedPointerBases& bases); |
| |
| // Restate some member functions, to keep chaining working nicely. |
| CFISection& Mark(Label* label) { Section::Mark(label); return *this; } |
| CFISection& D8(uint8_t v) { Section::D8(v); return *this; } |
| CFISection& D16(uint16_t v) { Section::D16(v); return *this; } |
| CFISection& D16(Label v) { Section::D16(v); return *this; } |
| CFISection& D32(uint32_t v) { Section::D32(v); return *this; } |
| CFISection& D32(const Label& v) { Section::D32(v); return *this; } |
| CFISection& D64(uint64_t v) { Section::D64(v); return *this; } |
| CFISection& D64(const Label& v) { Section::D64(v); return *this; } |
| CFISection& LEB128(long long v) { Section::LEB128(v); return *this; } |
| CFISection& ULEB128(uint64_t v) { Section::ULEB128(v); return *this; } |
| |
| private: |
| // A length value that we've appended to the section, but is not yet |
| // known. LENGTH is the appended value; START is a label referring |
| // to the start of the data whose length was cited. |
| struct PendingLength { |
| Label length; |
| Label start; |
| }; |
| |
| // Constants used in CFI/.eh_frame data: |
| |
| // If the first four bytes of an "initial length" are this constant, then |
| // the data uses the 64-bit DWARF format, and the length itself is the |
| // subsequent eight bytes. |
| static const uint32_t kDwarf64InitialLengthMarker = 0xffffffffU; |
| |
| // The CIE identifier for 32- and 64-bit DWARF CFI and .eh_frame data. |
| static const uint32_t kDwarf32CIEIdentifier = ~(uint32_t)0; |
| static const uint64_t kDwarf64CIEIdentifier = ~(uint64_t)0; |
| static const uint32_t kEHFrame32CIEIdentifier = 0; |
| static const uint64_t kEHFrame64CIEIdentifier = 0; |
| |
| // The size of a machine address for the data in this section. |
| size_t address_size_; |
| |
| // If true, we are generating a Linux .eh_frame section, instead of |
| // a standard DWARF .debug_frame section. |
| bool eh_frame_; |
| |
| // The encoding to use for FDE pointers. |
| DwarfPointerEncoding pointer_encoding_; |
| |
| // The base addresses to use when emitting encoded pointers. |
| EncodedPointerBases encoded_pointer_bases_; |
| |
| // The length value for the current entry. |
| // |
| // Oddly, this must be dynamically allocated. Labels never get new |
| // values; they only acquire constraints on the value they already |
| // have, or assert if you assign them something incompatible. So |
| // each header needs truly fresh Label objects to cite in their |
| // headers and track their positions. The alternative is explicit |
| // destructor invocation and a placement new. Ick. |
| PendingLength *entry_length_; |
| |
| // True if we are currently emitting an FDE --- that is, we have |
| // called FDEHeader but have not yet called FinishEntry. |
| bool in_fde_; |
| |
| // If in_fde_ is true, this is its starting address. We use this for |
| // emitting DW_EH_PE_funcrel pointers. |
| uint64_t fde_start_address_; |
| }; |
| |
| } // namespace google_breakpad |
| |
| #endif // PROCESSOR_CFI_ASSEMBLER_H_ |