|  | // Copyright (c) 2006, Google Inc. | 
|  | // All rights reserved. | 
|  | // | 
|  | // Redistribution and use in source and binary forms, with or without | 
|  | // modification, are permitted provided that the following conditions are | 
|  | // met: | 
|  | // | 
|  | //     * Redistributions of source code must retain the above copyright | 
|  | // notice, this list of conditions and the following disclaimer. | 
|  | //     * Redistributions in binary form must reproduce the above | 
|  | // copyright notice, this list of conditions and the following disclaimer | 
|  | // in the documentation and/or other materials provided with the | 
|  | // distribution. | 
|  | //     * Neither the name of Google Inc. nor the names of its | 
|  | // contributors may be used to endorse or promote products derived from | 
|  | // this software without specific prior written permission. | 
|  | // | 
|  | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | 
|  | // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | 
|  | // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | 
|  | // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT | 
|  | // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, | 
|  | // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | 
|  | // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | 
|  | // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | 
|  | // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | 
|  | // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 
|  | // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
|  |  | 
|  | // macho_id.cc: Functions to gather identifying information from a macho file | 
|  | // | 
|  | // See macho_id.h for documentation | 
|  | // | 
|  | // Author: Dan Waylonis | 
|  |  | 
|  |  | 
|  | #include <fcntl.h> | 
|  | #include <mach-o/loader.h> | 
|  | #include <stdio.h> | 
|  | #include <stdlib.h> | 
|  | #include <string.h> | 
|  | #include <sys/time.h> | 
|  | #include <sys/types.h> | 
|  | #include <unistd.h> | 
|  |  | 
|  | #include "common/mac/macho_id.h" | 
|  | #include "common/mac/macho_walker.h" | 
|  | #include "common/mac/macho_utilities.h" | 
|  |  | 
|  | namespace MacFileUtilities { | 
|  |  | 
|  | using google_breakpad::MD5Init; | 
|  | using google_breakpad::MD5Update; | 
|  | using google_breakpad::MD5Final; | 
|  |  | 
|  | MachoID::MachoID(const char *path) | 
|  | : memory_(0), | 
|  | memory_size_(0), | 
|  | crc_(0), | 
|  | md5_context_(), | 
|  | update_function_(NULL) { | 
|  | snprintf(path_, sizeof(path_), "%s", path); | 
|  | } | 
|  |  | 
|  | MachoID::MachoID(const char *path, void *memory, size_t size) | 
|  | : memory_(memory), | 
|  | memory_size_(size), | 
|  | crc_(0), | 
|  | md5_context_(), | 
|  | update_function_(NULL) { | 
|  | snprintf(path_, sizeof(path_), "%s", path); | 
|  | } | 
|  |  | 
|  | MachoID::~MachoID() { | 
|  | } | 
|  |  | 
|  | // The CRC info is from http://en.wikipedia.org/wiki/Adler-32 | 
|  | // With optimizations from http://www.zlib.net/ | 
|  |  | 
|  | // The largest prime smaller than 65536 | 
|  | #define MOD_ADLER 65521 | 
|  | // MAX_BLOCK is the largest n such that 255n(n+1)/2 + (n+1)(MAX_BLOCK-1) <= 2^32-1 | 
|  | #define MAX_BLOCK 5552 | 
|  |  | 
|  | void MachoID::UpdateCRC(unsigned char *bytes, size_t size) { | 
|  | // Unrolled loops for summing | 
|  | #define DO1(buf,i)  {sum1 += (buf)[i]; sum2 += sum1;} | 
|  | #define DO2(buf,i)  DO1(buf,i); DO1(buf,i+1); | 
|  | #define DO4(buf,i)  DO2(buf,i); DO2(buf,i+2); | 
|  | #define DO8(buf,i)  DO4(buf,i); DO4(buf,i+4); | 
|  | #define DO16(buf)   DO8(buf,0); DO8(buf,8); | 
|  | // Split up the crc | 
|  | uint32_t sum1 = crc_ & 0xFFFF; | 
|  | uint32_t sum2 = (crc_ >> 16) & 0xFFFF; | 
|  |  | 
|  | // Do large blocks | 
|  | while (size >= MAX_BLOCK) { | 
|  | size -= MAX_BLOCK; | 
|  | int block_count = MAX_BLOCK / 16; | 
|  | do { | 
|  | DO16(bytes); | 
|  | bytes += 16; | 
|  | } while (--block_count); | 
|  | sum1 %= MOD_ADLER; | 
|  | sum2 %= MOD_ADLER; | 
|  | } | 
|  |  | 
|  | // Do remaining bytes | 
|  | if (size) { | 
|  | while (size >= 16) { | 
|  | size -= 16; | 
|  | DO16(bytes); | 
|  | bytes += 16; | 
|  | } | 
|  | while (size--) { | 
|  | sum1 += *bytes++; | 
|  | sum2 += sum1; | 
|  | } | 
|  | sum1 %= MOD_ADLER; | 
|  | sum2 %= MOD_ADLER; | 
|  | crc_ = (sum2 << 16) | sum1; | 
|  | } | 
|  | } | 
|  |  | 
|  | void MachoID::UpdateMD5(unsigned char *bytes, size_t size) { | 
|  | MD5Update(&md5_context_, bytes, static_cast<unsigned>(size)); | 
|  | } | 
|  |  | 
|  | void MachoID::Update(MachoWalker *walker, off_t offset, size_t size) { | 
|  | if (!update_function_ || !size) | 
|  | return; | 
|  |  | 
|  | // Read up to 4k bytes at a time | 
|  | unsigned char buffer[4096]; | 
|  | size_t buffer_size; | 
|  | off_t file_offset = offset; | 
|  | while (size > 0) { | 
|  | if (size > sizeof(buffer)) { | 
|  | buffer_size = sizeof(buffer); | 
|  | size -= buffer_size; | 
|  | } else { | 
|  | buffer_size = size; | 
|  | size = 0; | 
|  | } | 
|  |  | 
|  | if (!walker->ReadBytes(buffer, buffer_size, file_offset)) | 
|  | return; | 
|  |  | 
|  | (this->*update_function_)(buffer, buffer_size); | 
|  | file_offset += buffer_size; | 
|  | } | 
|  | } | 
|  |  | 
|  | bool MachoID::UUIDCommand(cpu_type_t cpu_type, | 
|  | cpu_subtype_t cpu_subtype, | 
|  | unsigned char bytes[16]) { | 
|  | struct breakpad_uuid_command uuid_cmd; | 
|  | uuid_cmd.cmd = 0; | 
|  | if (!WalkHeader(cpu_type, cpu_subtype, UUIDWalkerCB, &uuid_cmd)) | 
|  | return false; | 
|  |  | 
|  | // If we found the command, we'll have initialized the uuid_command | 
|  | // structure | 
|  | if (uuid_cmd.cmd == LC_UUID) { | 
|  | memcpy(bytes, uuid_cmd.uuid, sizeof(uuid_cmd.uuid)); | 
|  | return true; | 
|  | } | 
|  |  | 
|  | return false; | 
|  | } | 
|  |  | 
|  | bool MachoID::IDCommand(cpu_type_t cpu_type, | 
|  | cpu_subtype_t cpu_subtype, | 
|  | unsigned char identifier[16]) { | 
|  | struct dylib_command dylib_cmd; | 
|  | dylib_cmd.cmd = 0; | 
|  | if (!WalkHeader(cpu_type, cpu_subtype, IDWalkerCB, &dylib_cmd)) | 
|  | return false; | 
|  |  | 
|  | // If we found the command, we'll have initialized the dylib_command | 
|  | // structure | 
|  | if (dylib_cmd.cmd == LC_ID_DYLIB) { | 
|  | // Take the hashed filename, version, and compatability version bytes | 
|  | // to form the first 12 bytes, pad the rest with zeros | 
|  |  | 
|  | // create a crude hash of the filename to generate the first 4 bytes | 
|  | identifier[0] = 0; | 
|  | identifier[1] = 0; | 
|  | identifier[2] = 0; | 
|  | identifier[3] = 0; | 
|  |  | 
|  | for (int j = 0, i = (int)strlen(path_)-1; i>=0 && path_[i]!='/'; ++j, --i) { | 
|  | identifier[j%4] += path_[i]; | 
|  | } | 
|  |  | 
|  | identifier[4] = (dylib_cmd.dylib.current_version >> 24) & 0xFF; | 
|  | identifier[5] = (dylib_cmd.dylib.current_version >> 16) & 0xFF; | 
|  | identifier[6] = (dylib_cmd.dylib.current_version >> 8) & 0xFF; | 
|  | identifier[7] = dylib_cmd.dylib.current_version & 0xFF; | 
|  | identifier[8] = (dylib_cmd.dylib.compatibility_version >> 24) & 0xFF; | 
|  | identifier[9] = (dylib_cmd.dylib.compatibility_version >> 16) & 0xFF; | 
|  | identifier[10] = (dylib_cmd.dylib.compatibility_version >> 8) & 0xFF; | 
|  | identifier[11] = dylib_cmd.dylib.compatibility_version & 0xFF; | 
|  | identifier[12] = (cpu_type >> 24) & 0xFF; | 
|  | identifier[13] = (cpu_type >> 16) & 0xFF; | 
|  | identifier[14] = (cpu_type >> 8) & 0xFF; | 
|  | identifier[15] = cpu_type & 0xFF; | 
|  |  | 
|  | return true; | 
|  | } | 
|  |  | 
|  | return false; | 
|  | } | 
|  |  | 
|  | uint32_t MachoID::Adler32(cpu_type_t cpu_type, cpu_subtype_t cpu_subtype) { | 
|  | update_function_ = &MachoID::UpdateCRC; | 
|  | crc_ = 0; | 
|  |  | 
|  | if (!WalkHeader(cpu_type, cpu_subtype, WalkerCB, this)) | 
|  | return 0; | 
|  |  | 
|  | return crc_; | 
|  | } | 
|  |  | 
|  | bool MachoID::MD5(cpu_type_t cpu_type, cpu_subtype_t cpu_subtype, unsigned char identifier[16]) { | 
|  | update_function_ = &MachoID::UpdateMD5; | 
|  |  | 
|  | MD5Init(&md5_context_); | 
|  |  | 
|  | if (!WalkHeader(cpu_type, cpu_subtype, WalkerCB, this)) | 
|  | return false; | 
|  |  | 
|  | MD5Final(identifier, &md5_context_); | 
|  | return true; | 
|  | } | 
|  |  | 
|  | bool MachoID::WalkHeader(cpu_type_t cpu_type, | 
|  | cpu_subtype_t cpu_subtype, | 
|  | MachoWalker::LoadCommandCallback callback, | 
|  | void *context) { | 
|  | if (memory_) { | 
|  | MachoWalker walker(memory_, memory_size_, callback, context); | 
|  | return walker.WalkHeader(cpu_type, cpu_subtype); | 
|  | } else { | 
|  | MachoWalker walker(path_, callback, context); | 
|  | return walker.WalkHeader(cpu_type, cpu_subtype); | 
|  | } | 
|  | } | 
|  |  | 
|  | // static | 
|  | bool MachoID::WalkerCB(MachoWalker *walker, load_command *cmd, off_t offset, | 
|  | bool swap, void *context) { | 
|  | MachoID *macho_id = (MachoID *)context; | 
|  |  | 
|  | if (cmd->cmd == LC_SEGMENT) { | 
|  | struct segment_command seg; | 
|  |  | 
|  | if (!walker->ReadBytes(&seg, sizeof(seg), offset)) | 
|  | return false; | 
|  |  | 
|  | if (swap) | 
|  | breakpad_swap_segment_command(&seg); | 
|  |  | 
|  | struct mach_header_64 header; | 
|  | off_t header_offset; | 
|  |  | 
|  | if (!walker->CurrentHeader(&header, &header_offset)) | 
|  | return false; | 
|  |  | 
|  | // Process segments that have sections: | 
|  | // (e.g., __TEXT, __DATA, __IMPORT, __OBJC) | 
|  | offset += sizeof(struct segment_command); | 
|  | struct section sec; | 
|  | for (unsigned long i = 0; i < seg.nsects; ++i) { | 
|  | if (!walker->ReadBytes(&sec, sizeof(sec), offset)) | 
|  | return false; | 
|  |  | 
|  | if (swap) | 
|  | breakpad_swap_section(&sec, 1); | 
|  |  | 
|  | // sections of type S_ZEROFILL are "virtual" and contain no data | 
|  | // in the file itself | 
|  | if ((sec.flags & SECTION_TYPE) != S_ZEROFILL && sec.offset != 0) | 
|  | macho_id->Update(walker, header_offset + sec.offset, sec.size); | 
|  |  | 
|  | offset += sizeof(struct section); | 
|  | } | 
|  | } else if (cmd->cmd == LC_SEGMENT_64) { | 
|  | struct segment_command_64 seg64; | 
|  |  | 
|  | if (!walker->ReadBytes(&seg64, sizeof(seg64), offset)) | 
|  | return false; | 
|  |  | 
|  | if (swap) | 
|  | breakpad_swap_segment_command_64(&seg64); | 
|  |  | 
|  | struct mach_header_64 header; | 
|  | off_t header_offset; | 
|  |  | 
|  | if (!walker->CurrentHeader(&header, &header_offset)) | 
|  | return false; | 
|  |  | 
|  | // Process segments that have sections: | 
|  | // (e.g., __TEXT, __DATA, __IMPORT, __OBJC) | 
|  | offset += sizeof(struct segment_command_64); | 
|  | struct section_64 sec64; | 
|  | for (unsigned long i = 0; i < seg64.nsects; ++i) { | 
|  | if (!walker->ReadBytes(&sec64, sizeof(sec64), offset)) | 
|  | return false; | 
|  |  | 
|  | if (swap) | 
|  | breakpad_swap_section_64(&sec64, 1); | 
|  |  | 
|  | // sections of type S_ZEROFILL are "virtual" and contain no data | 
|  | // in the file itself | 
|  | if ((sec64.flags & SECTION_TYPE) != S_ZEROFILL && sec64.offset != 0) | 
|  | macho_id->Update(walker, | 
|  | header_offset + sec64.offset, | 
|  | (size_t)sec64.size); | 
|  |  | 
|  | offset += sizeof(struct section_64); | 
|  | } | 
|  | } | 
|  |  | 
|  | // Continue processing | 
|  | return true; | 
|  | } | 
|  |  | 
|  | // static | 
|  | bool MachoID::UUIDWalkerCB(MachoWalker *walker, load_command *cmd, off_t offset, | 
|  | bool swap, void *context) { | 
|  | if (cmd->cmd == LC_UUID) { | 
|  | struct breakpad_uuid_command *uuid_cmd = | 
|  | (struct breakpad_uuid_command *)context; | 
|  |  | 
|  | if (!walker->ReadBytes(uuid_cmd, sizeof(struct breakpad_uuid_command), | 
|  | offset)) | 
|  | return false; | 
|  |  | 
|  | if (swap) | 
|  | breakpad_swap_uuid_command(uuid_cmd); | 
|  |  | 
|  | return false; | 
|  | } | 
|  |  | 
|  | // Continue processing | 
|  | return true; | 
|  | } | 
|  |  | 
|  | // static | 
|  | bool MachoID::IDWalkerCB(MachoWalker *walker, load_command *cmd, off_t offset, | 
|  | bool swap, void *context) { | 
|  | if (cmd->cmd == LC_ID_DYLIB) { | 
|  | struct dylib_command *dylib_cmd = (struct dylib_command *)context; | 
|  |  | 
|  | if (!walker->ReadBytes(dylib_cmd, sizeof(struct dylib_command), offset)) | 
|  | return false; | 
|  |  | 
|  | if (swap) | 
|  | breakpad_swap_dylib_command(dylib_cmd); | 
|  |  | 
|  | return false; | 
|  | } | 
|  |  | 
|  | // Continue processing | 
|  | return true; | 
|  | } | 
|  |  | 
|  | }  // namespace MacFileUtilities |