| // Copyright (c) 2010 Google Inc. All Rights Reserved. |
| // |
| // Redistribution and use in source and binary forms, with or without |
| // modification, are permitted provided that the following conditions are |
| // met: |
| // |
| // * Redistributions of source code must retain the above copyright |
| // notice, this list of conditions and the following disclaimer. |
| // * Redistributions in binary form must reproduce the above |
| // copyright notice, this list of conditions and the following disclaimer |
| // in the documentation and/or other materials provided with the |
| // distribution. |
| // * Neither the name of Google Inc. nor the names of its |
| // contributors may be used to endorse or promote products derived from |
| // this software without specific prior written permission. |
| // |
| // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| |
| #include <assert.h> |
| #include <stdint.h> |
| #include <stdlib.h> |
| |
| #include "common/dwarf/bytereader-inl.h" |
| #include "common/dwarf/bytereader.h" |
| |
| namespace dwarf2reader { |
| |
| ByteReader::ByteReader(enum Endianness endian) |
| :offset_reader_(NULL), address_reader_(NULL), endian_(endian), |
| address_size_(0), offset_size_(0), |
| have_section_base_(), have_text_base_(), have_data_base_(), |
| have_function_base_() { } |
| |
| ByteReader::~ByteReader() { } |
| |
| void ByteReader::SetOffsetSize(uint8 size) { |
| offset_size_ = size; |
| assert(size == 4 || size == 8); |
| if (size == 4) { |
| this->offset_reader_ = &ByteReader::ReadFourBytes; |
| } else { |
| this->offset_reader_ = &ByteReader::ReadEightBytes; |
| } |
| } |
| |
| void ByteReader::SetAddressSize(uint8 size) { |
| address_size_ = size; |
| assert(size == 4 || size == 8); |
| if (size == 4) { |
| this->address_reader_ = &ByteReader::ReadFourBytes; |
| } else { |
| this->address_reader_ = &ByteReader::ReadEightBytes; |
| } |
| } |
| |
| uint64 ByteReader::ReadInitialLength(const uint8_t *start, size_t* len) { |
| const uint64 initial_length = ReadFourBytes(start); |
| start += 4; |
| |
| // In DWARF2/3, if the initial length is all 1 bits, then the offset |
| // size is 8 and we need to read the next 8 bytes for the real length. |
| if (initial_length == 0xffffffff) { |
| SetOffsetSize(8); |
| *len = 12; |
| return ReadOffset(start); |
| } else { |
| SetOffsetSize(4); |
| *len = 4; |
| } |
| return initial_length; |
| } |
| |
| bool ByteReader::ValidEncoding(DwarfPointerEncoding encoding) const { |
| if (encoding == DW_EH_PE_omit) return true; |
| if (encoding == DW_EH_PE_aligned) return true; |
| if ((encoding & 0x7) > DW_EH_PE_udata8) |
| return false; |
| if ((encoding & 0x70) > DW_EH_PE_funcrel) |
| return false; |
| return true; |
| } |
| |
| bool ByteReader::UsableEncoding(DwarfPointerEncoding encoding) const { |
| switch (encoding & 0x70) { |
| case DW_EH_PE_absptr: return true; |
| case DW_EH_PE_pcrel: return have_section_base_; |
| case DW_EH_PE_textrel: return have_text_base_; |
| case DW_EH_PE_datarel: return have_data_base_; |
| case DW_EH_PE_funcrel: return have_function_base_; |
| default: return false; |
| } |
| } |
| |
| uint64 ByteReader::ReadEncodedPointer(const uint8_t *buffer, |
| DwarfPointerEncoding encoding, |
| size_t *len) const { |
| // UsableEncoding doesn't approve of DW_EH_PE_omit, so we shouldn't |
| // see it here. |
| assert(encoding != DW_EH_PE_omit); |
| |
| // The Linux Standards Base 4.0 does not make this clear, but the |
| // GNU tools (gcc/unwind-pe.h; readelf/dwarf.c; gdb/dwarf2-frame.c) |
| // agree that aligned pointers are always absolute, machine-sized, |
| // machine-signed pointers. |
| if (encoding == DW_EH_PE_aligned) { |
| assert(have_section_base_); |
| |
| // We don't need to align BUFFER in *our* address space. Rather, we |
| // need to find the next position in our buffer that would be aligned |
| // when the .eh_frame section the buffer contains is loaded into the |
| // program's memory. So align assuming that buffer_base_ gets loaded at |
| // address section_base_, where section_base_ itself may or may not be |
| // aligned. |
| |
| // First, find the offset to START from the closest prior aligned |
| // address. |
| uint64 skew = section_base_ & (AddressSize() - 1); |
| // Now find the offset from that aligned address to buffer. |
| uint64 offset = skew + (buffer - buffer_base_); |
| // Round up to the next boundary. |
| uint64 aligned = (offset + AddressSize() - 1) & -AddressSize(); |
| // Convert back to a pointer. |
| const uint8_t *aligned_buffer = buffer_base_ + (aligned - skew); |
| // Finally, store the length and actually fetch the pointer. |
| *len = aligned_buffer - buffer + AddressSize(); |
| return ReadAddress(aligned_buffer); |
| } |
| |
| // Extract the value first, ignoring whether it's a pointer or an |
| // offset relative to some base. |
| uint64 offset; |
| switch (encoding & 0x0f) { |
| case DW_EH_PE_absptr: |
| // DW_EH_PE_absptr is weird, as it is used as a meaningful value for |
| // both the high and low nybble of encoding bytes. When it appears in |
| // the high nybble, it means that the pointer is absolute, not an |
| // offset from some base address. When it appears in the low nybble, |
| // as here, it means that the pointer is stored as a normal |
| // machine-sized and machine-signed address. A low nybble of |
| // DW_EH_PE_absptr does not imply that the pointer is absolute; it is |
| // correct for us to treat the value as an offset from a base address |
| // if the upper nybble is not DW_EH_PE_absptr. |
| offset = ReadAddress(buffer); |
| *len = AddressSize(); |
| break; |
| |
| case DW_EH_PE_uleb128: |
| offset = ReadUnsignedLEB128(buffer, len); |
| break; |
| |
| case DW_EH_PE_udata2: |
| offset = ReadTwoBytes(buffer); |
| *len = 2; |
| break; |
| |
| case DW_EH_PE_udata4: |
| offset = ReadFourBytes(buffer); |
| *len = 4; |
| break; |
| |
| case DW_EH_PE_udata8: |
| offset = ReadEightBytes(buffer); |
| *len = 8; |
| break; |
| |
| case DW_EH_PE_sleb128: |
| offset = ReadSignedLEB128(buffer, len); |
| break; |
| |
| case DW_EH_PE_sdata2: |
| offset = ReadTwoBytes(buffer); |
| // Sign-extend from 16 bits. |
| offset = (offset ^ 0x8000) - 0x8000; |
| *len = 2; |
| break; |
| |
| case DW_EH_PE_sdata4: |
| offset = ReadFourBytes(buffer); |
| // Sign-extend from 32 bits. |
| offset = (offset ^ 0x80000000ULL) - 0x80000000ULL; |
| *len = 4; |
| break; |
| |
| case DW_EH_PE_sdata8: |
| // No need to sign-extend; this is the full width of our type. |
| offset = ReadEightBytes(buffer); |
| *len = 8; |
| break; |
| |
| default: |
| abort(); |
| } |
| |
| // Find the appropriate base address. |
| uint64 base; |
| switch (encoding & 0x70) { |
| case DW_EH_PE_absptr: |
| base = 0; |
| break; |
| |
| case DW_EH_PE_pcrel: |
| assert(have_section_base_); |
| base = section_base_ + (buffer - buffer_base_); |
| break; |
| |
| case DW_EH_PE_textrel: |
| assert(have_text_base_); |
| base = text_base_; |
| break; |
| |
| case DW_EH_PE_datarel: |
| assert(have_data_base_); |
| base = data_base_; |
| break; |
| |
| case DW_EH_PE_funcrel: |
| assert(have_function_base_); |
| base = function_base_; |
| break; |
| |
| default: |
| abort(); |
| } |
| |
| uint64 pointer = base + offset; |
| |
| // Remove inappropriate upper bits. |
| if (AddressSize() == 4) |
| pointer = pointer & 0xffffffff; |
| else |
| assert(AddressSize() == sizeof(uint64)); |
| |
| return pointer; |
| } |
| |
| Endianness ByteReader::GetEndianness() const { |
| return endian_; |
| } |
| |
| } // namespace dwarf2reader |