简介
- Mach-O 是 Mach 目标文件格式的缩写,是一种用于可执行文件、目标代码、共享库、动态加载代码和核心转储的文件格式
- 对mach-o对解析需要考虑到两点:
- 有的文件是以典型的mac-o头开始的
- 而有的文件则是以一个fat头开始的(详细如下文)
查看工具
otool
1 2 3 4 5 6 7 |
otool -h libuecm.dylib # 显示如下 libuecm.dylib: Mach header magic cputype cpusubtype caps filetype ncmds sizeofcmds flags 0xfeedfacf 16777223 3 0x00 6 16 1640 0x00118085 |
machOView
- 用这个图形工具打开目标文件,查看详细信息
Editor
mach-o结构
典型的mach-o
- mach-o header
- 包含有关二进制文件的一般信息
- load commands
- 它是一种目录,描述了段的位置、符号表、动态符号表等。每个加载命令都包含一个元信息,例如命令类型、名称、二进制文件中的位置等
- data
- 包含代码和数据,如符号表、动态符号表等
通用文件结构,也称fat file
- fat header
- 存放了fat file信息,以及不同架构的mach-o的位置
- mach-o header
- load commands
- data
- mach-o header
- load commands
- data
区别
- Mach-O 文件包含一种架构(i386、x86_64、arm64 等)的目标代码。
- Fat 二进制文件可能包含多个目标文件,因此包含不同架构(i386 和 x86_64、arm 和 arm64、 ETC。)
结构体
mach-o
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 |
// 32-bit struct mach_header { uint32_t magic; cpu_type_t cputype; cpu_subtype_t cpusubtype; uint32_t filetype; uint32_t ncmds; uint32_t sizeofcmds; uint32_t flags; }; struct segment_command { uint32_t cmd; uint32_t cmdsize; char segname[16]; uint32_t vmaddr; uint32_t vmsize; uint32_t fileoff; uint32_t filesize; vm_prot_t maxprot; vm_prot_t initprot; uint32_t nsects; uint32_t flags; }; // 64-bit struct mach_header_64 { uint32_t magic; /* mach magic number identifier */ int32_t cputype; /* cpu specifier */ int32_t cpusubtype; /* machine specifier */ uint32_t filetype; /* type of file */ uint32_t ncmds; /* number of load commands */ uint32_t sizeofcmds; /* the size of all the load commands */ uint32_t flags; /* flags */ uint32_t reserved; /* reserved */ }; struct segment_command_64 { /* for 64-bit architectures */ uint32_t cmd; /* LC_SEGMENT_64 */ uint32_t cmdsize; /* includes sizeof section_64 structs */ char segname[16]; /* segment name */ uint64_t vmaddr; /* memory address of this segment */ uint64_t vmsize; /* memory size of this segment */ uint64_t fileoff; /* file offset of this segment */ uint64_t filesize; /* amount to map from the file */ int32_t maxprot; /* maximum VM protection */ int32_t initprot; /* initial VM protection */ uint32_t nsects; /* number of sections in segment */ uint32_t flags; /* flags */ }; |
解析
mach_o.h
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 |
#ifndef TESTPRO_COMMON_MAC_COMMON_MACH_O_H_ #define TESTPRO_COMMON_MAC_COMMON_MACH_O_H_ #include <stdio.h> #include <stdlib.h> namespace mac_common { class en_mach_o { public: explicit en_mach_o(const char *filename); ~en_mach_o(); void segments(); bool is_parse_success(); bool is_file_execute(); private: uint32_t read_magic(FILE *obj_file, int offset); bool is_magic_64(); bool should_swap_bytes(); void mach_o_header(int offset, bool is_64, bool should_swap); void fat_header(int is_swap); bool is_fat(); private: bool state_; uint32_t magic_; uint32_t file_type_; FILE * file_; }; } // namespace mac_common #endif //TESTPRO_COMMON_MAC_COMMON_MACH_O_H_ |
mach_o.cpp
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 |
#include "mach_o.h" #include <mach-o/loader.h> #include <mach-o/swap.h> #include <boost/filesystem.hpp> namespace mac_common { #define SWAP32(x) ((((x) & 0xff000000) >> 24) | (((x) & 0xff0000) >> 8) | (((x) & 0xff00) << 8) | (((x) & 0xff) << 24)) en_mach_o::en_mach_o(const char *filename) : file_(nullptr), state_(false), file_type_(0), magic_(0) { if (!boost::filesystem::exists(filename)) { return; } file_ = fopen(filename, "rb"); if (!file_) { return; } magic_ = read_magic(file_, 0); if (magic_ != 0) { state_ = true; } } en_mach_o::~en_mach_o() { if (file_) { fclose(file_); } } void en_mach_o::segments() { if (!file_) { return; } if (magic_ == 0) { return; } auto is_64 = is_magic_64(); auto is_swap = should_swap_bytes(); auto is_fat_file = is_fat(); if (is_fat_file) { fat_header(is_swap); } else { mach_o_header(0, is_64, is_swap); } } bool en_mach_o::is_parse_success() { return state_; } bool en_mach_o::is_file_execute() { return file_type_ == MH_EXECUTE; } uint32_t en_mach_o::read_magic(FILE *obj_file, int offset) { if (!obj_file) { return 0; } uint32_t magic(0); fseek(obj_file, offset, SEEK_SET); fread(&magic, sizeof(uint32_t), 1, obj_file); return magic; } bool en_mach_o::is_magic_64() { return magic_ == MH_MAGIC_64 || magic_ == MH_CIGAM_64; } bool en_mach_o::should_swap_bytes() { return magic_ == MH_CIGAM || magic_ == MH_CIGAM_64; } void* load_bytes(FILE *obj_file, int offset, int size) { void *buf = calloc(1, size); fseek(obj_file, offset, SEEK_SET); fread(buf, size, 1, obj_file); return buf; } void en_mach_o::mach_o_header(int offset, bool is_64, bool should_swap) { if (!file_) { return; } if (is_64) { int header_size = sizeof(struct mach_header_64); auto ptr = load_bytes(file_, offset, header_size); if (!ptr) { return; } struct mach_header_64 *header = static_cast<mach_header_64 *>(ptr); if (should_swap) { swap_mach_header_64(header, NX_UnknownByteOrder); } file_type_ = header->filetype; free(header); } else { int header_size = sizeof(struct mach_header); auto ptr = load_bytes(file_, offset, header_size); struct mach_header *header = static_cast<mach_header *>(ptr); if (should_swap) { swap_mach_header(header, NX_UnknownByteOrder); } file_type_ = header->filetype; free(header); } } void en_mach_o::fat_header(int is_swap) { if (!file_) { return; } size_t header_size = sizeof(struct fat_header); size_t arch_size = sizeof(struct fat_arch); auto ptr = load_bytes(file_, 0, header_size); struct fat_header *header = static_cast<struct fat_header*>(ptr); if (is_swap) { swap_fat_header(header, NX_UnknownByteOrder); } off_t arch_offset = (off_t)header_size; auto num = SWAP32(header->nfat_arch); for (uint32_t i = 0U; i < num; i++) { auto p = load_bytes(file_, arch_offset, arch_size); struct fat_arch *arch = static_cast<fat_arch*>(p); if (is_swap) { swap_fat_arch(arch, 1, NX_UnknownByteOrder); } off_t mach_header_offset = (off_t)(SWAP32(arch->offset)); free(arch); arch_offset += arch_size; magic_ = read_magic(file_, mach_header_offset+1); if (is_file_execute()) { break; } auto is_64 = is_magic_64(); auto is_swap_mach = should_swap_bytes(); mach_o_header(mach_header_offset, is_64, is_swap_mach); } free(header); } bool en_mach_o::is_fat() { return magic_ == FAT_MAGIC || magic_ == FAT_CIGAM; } } // namespace mac_common |
使用
- 上述解析代码,并没有写关于load_commands的部分
- 上述解析代码,包含了获取常规mach-o头和fat头的信息的功能
- 在封装时只封装了判断一个文件是不是可执行文件,像其他的cpu信息,架构信息等,也是可以获取
1 2 3 4 5 6 |
// a file path mac_common::en_mach_o mach(path.string().c_str()); mach.segments(); if (mach.is_parse_success() && mach.is_file_execute()) { //res.push_back(path.string()); } |
本文为原创文章,版权归Aet所有,欢迎分享本文,转载请保留出处!
你可能也喜欢
- ♥ 深入理解C++11:C++11新特性解析与应用 一12/21
- ♥ 深度探索C++对象模型一02/09
- ♥ Macos开发问题:aarch64架构宏不识别06/25
- ♥ C++标准模板库编程实战_智能指针11/30
- ♥ Macos网络信息相关06/06
- ♥ Cef:介绍06/29