// Copyright 2014 Renato Tegon Forti, Antony Polukhin. // Copyright Antony Polukhin, 2015-2025. // // Distributed under the Boost Software License, Version 1.0. // (See accompanying file LICENSE_1_0.txt // or copy at http://www.boost.org/LICENSE_1_0.txt) #ifndef BOOST_DLL_DETAIL_MACHO_INFO_HPP #define BOOST_DLL_DETAIL_MACHO_INFO_HPP #include #ifdef BOOST_HAS_PRAGMA_ONCE # pragma once #endif #include #include #include #include // for std::getline #include namespace boost { namespace dll { namespace detail { using integer_t = int; using vm_prot_t = int; using cpu_type_t = integer_t; using cpu_subtype_t = integer_t; template struct mach_header_template { std::uint32_t magic; cpu_type_t cputype; cpu_subtype_t cpusubtype; std::uint32_t filetype; std::uint32_t ncmds; std::uint32_t sizeofcmds; std::uint32_t flags[sizeof(AddressOffsetT) / sizeof(std::uint32_t)]; // Flags and reserved }; using mach_header_32_ = mach_header_template; using mach_header_64_ = mach_header_template; struct load_command_ { std::uint32_t cmd; /* type of command */ std::uint32_t cmdsize; }; struct load_command_types { static constexpr std::uint32_t LC_SEGMENT_ = 0x1; /* segment of this file to be mapped */ static constexpr std::uint32_t LC_SYMTAB_ = 0x2; /* link-edit stab symbol table info */ static constexpr std::uint32_t LC_SYMSEG_ = 0x3; /* link-edit gdb symbol table info (obsolete) */ static constexpr std::uint32_t LC_THREAD_ = 0x4; /* thread */ static constexpr std::uint32_t LC_UNIXTHREAD_ = 0x5; /* unix thread (includes a stack) */ static constexpr std::uint32_t LC_LOADFVMLIB_ = 0x6; /* load a specified fixed VM shared library */ static constexpr std::uint32_t LC_IDFVMLIB_ = 0x7; /* fixed VM shared library identification */ static constexpr std::uint32_t LC_IDENT_ = 0x8; /* object identification info (obsolete) */ static constexpr std::uint32_t LC_FVMFILE_ = 0x9; /* fixed VM file inclusion (internal use) */ static constexpr std::uint32_t LC_PREPAGE_ = 0xa; /* prepage command (internal use) */ static constexpr std::uint32_t LC_DYSYMTAB_ = 0xb; /* dynamic link-edit symbol table info */ static constexpr std::uint32_t LC_LOAD_DYLIB_ = 0xc; /* load a dynamically linked shared library */ static constexpr std::uint32_t LC_ID_DYLIB_ = 0xd; /* dynamically linked shared lib ident */ static constexpr std::uint32_t LC_LOAD_DYLINKER_ = 0xe; /* load a dynamic linker */ static constexpr std::uint32_t LC_ID_DYLINKER_ = 0xf; /* dynamic linker identification */ static constexpr std::uint32_t LC_PREBOUND_DYLIB_ = 0x10; /* modules prebound for a dynamically linked shared library */ static constexpr std::uint32_t LC_ROUTINES_ = 0x11; /* image routines */ static constexpr std::uint32_t LC_SUB_FRAMEWORK_ = 0x12; /* sub framework */ static constexpr std::uint32_t LC_SUB_UMBRELLA_ = 0x13; /* sub umbrella */ static constexpr std::uint32_t LC_SUB_CLIENT_ = 0x14; /* sub client */ static constexpr std::uint32_t LC_SUB_LIBRARY_ = 0x15; /* sub library */ static constexpr std::uint32_t LC_TWOLEVEL_HINTS_ = 0x16; /* two-level namespace lookup hints */ static constexpr std::uint32_t LC_PREBIND_CKSUM_ = 0x17; /* prebind checksum */ /* * After MacOS X 10.1 when a new load command is added that is required to be * understood by the dynamic linker for the image to execute properly the * LC_REQ_DYLD bit will be or'ed into the load command constant. If the dynamic * linker sees such a load command it it does not understand will issue a * "unknown load command required for execution" error and refuse to use the * image. Other load commands without this bit that are not understood will * simply be ignored. */ static constexpr std::uint32_t LC_REQ_DYLD_ = 0x80000000; /* * load a dynamically linked shared library that is allowed to be missing * (all symbols are weak imported). */ static constexpr std::uint32_t LC_LOAD_WEAK_DYLIB_ = (0x18 | LC_REQ_DYLD_); static constexpr std::uint32_t LC_SEGMENT_64_ = 0x19; /* 64-bit segment of this file to be mapped */ static constexpr std::uint32_t LC_ROUTINES_64_ = 0x1a; /* 64-bit image routines */ static constexpr std::uint32_t LC_UUID_ = 0x1b; /* the uuid */ static constexpr std::uint32_t LC_RPATH_ = (0x1c | LC_REQ_DYLD_); /* runpath additions */ static constexpr std::uint32_t LC_CODE_SIGNATURE_ = 0x1d; /* local of code signature */ static constexpr std::uint32_t LC_SEGMENT_SPLIT_INFO_= 0x1e; /* local of info to split segments */ static constexpr std::uint32_t LC_REEXPORT_DYLIB_ = (0x1f | LC_REQ_DYLD_); /* load and re-export dylib */ static constexpr std::uint32_t LC_LAZY_LOAD_DYLIB_ = 0x20; /* delay load of dylib until first use */ static constexpr std::uint32_t LC_ENCRYPTION_INFO_ = 0x21; /* encrypted segment information */ static constexpr std::uint32_t LC_DYLD_INFO_ = 0x22; /* compressed dyld information */ static constexpr std::uint32_t LC_DYLD_INFO_ONLY_ = (0x22|LC_REQ_DYLD_); /* compressed dyld information only */ }; template struct segment_command_template { std::uint32_t cmd; /* LC_SEGMENT_ */ std::uint32_t cmdsize; /* includes sizeof section structs */ char segname[16]; /* segment name */ AddressOffsetT vmaddr; /* memory address of this segment */ AddressOffsetT vmsize; /* memory size of this segment */ AddressOffsetT fileoff; /* file offset of this segment */ AddressOffsetT filesize; /* amount to map from the file */ vm_prot_t maxprot; /* maximum VM protection */ vm_prot_t initprot; /* initial VM protection */ std::uint32_t nsects; /* number of sections in segment */ std::uint32_t flags; /* flags */ }; using segment_command_32_ = segment_command_template; using segment_command_64_ = segment_command_template; template struct section_template { char sectname[16]; /* name of this section */ char segname[16]; /* segment this section goes in */ AddressOffsetT addr; /* memory address of this section */ AddressOffsetT size; /* size in bytes of this section */ std::uint32_t offset; /* file offset of this section */ std::uint32_t align; /* section alignment (power of 2) */ std::uint32_t reloff; /* file offset of relocation entries */ std::uint32_t nreloc; /* number of relocation entries */ std::uint32_t flags; /* flags (section type and attributes)*/ std::uint32_t reserved[1 + sizeof(AddressOffsetT) / sizeof(std::uint32_t)]; }; using section_32_ = section_template ; using section_64_ = section_template; struct symtab_command_ { std::uint32_t cmd; /* LC_SYMTAB_ */ std::uint32_t cmdsize; /* sizeof(struct symtab_command) */ std::uint32_t symoff; /* symbol table offset */ std::uint32_t nsyms; /* number of symbol table entries */ std::uint32_t stroff; /* string table offset */ std::uint32_t strsize; /* string table size in bytes */ }; template struct nlist_template { std::uint32_t n_strx; std::uint8_t n_type; std::uint8_t n_sect; std::uint16_t n_desc; AddressOffsetT n_value; }; using nlist_32_ = nlist_template ; using nlist_64_ = nlist_template ; template class macho_info { using header_t = boost::dll::detail::mach_header_template; using load_command_t = boost::dll::detail::load_command_; using segment_t = boost::dll::detail::segment_command_template; using section_t = boost::dll::detail::section_template; using symbol_header_t = boost::dll::detail::symtab_command_; using nlist_t = boost::dll::detail::nlist_template; static constexpr std::uint32_t SEGMENT_CMD_NUMBER = (sizeof(AddressOffsetT) > 4 ? load_command_types::LC_SEGMENT_64_ : load_command_types::LC_SEGMENT_); public: static bool parsing_supported(std::ifstream& fs) { static const uint32_t magic_bytes = (sizeof(AddressOffsetT) <= sizeof(uint32_t) ? 0xfeedface : 0xfeedfacf); uint32_t magic; fs.seekg(0); fs.read(reinterpret_cast(&magic), sizeof(magic)); return (magic_bytes == magic); } private: template static void read_raw(std::ifstream& fs, T& value, std::size_t size = sizeof(T)) { fs.read(reinterpret_cast(&value), size); } template static void command_finder(std::ifstream& fs, uint32_t cmd_num, F callback_f) { const header_t h = header(fs); load_command_t command; fs.seekg(sizeof(header_t)); for (std::size_t i = 0; i < h.ncmds; ++i) { const std::ifstream::pos_type pos = fs.tellg(); read_raw(fs, command); if (command.cmd != cmd_num) { fs.seekg(pos + static_cast(command.cmdsize)); continue; } fs.seekg(pos); callback_f(fs); fs.seekg(pos + static_cast(command.cmdsize)); } } struct section_names_gather { std::vector& ret; void operator()(std::ifstream& fs) const { segment_t segment; read_raw(fs, segment); section_t section; ret.reserve(ret.size() + segment.nsects); for (std::size_t j = 0; j < segment.nsects; ++j) { read_raw(fs, section); // `segname` goes right after the `sectname`. // Forcing `sectname` to end on '\0' section.segname[0] = '\0'; ret.push_back(section.sectname); if (ret.back().empty()) { ret.pop_back(); // Do not show empty names } } } }; struct symbol_names_gather { std::vector& ret; std::size_t section_index; void operator()(std::ifstream& fs) const { symbol_header_t symbh; read_raw(fs, symbh); ret.reserve(ret.size() + symbh.nsyms); nlist_t symbol; std::string symbol_name; for (std::size_t j = 0; j < symbh.nsyms; ++j) { fs.seekg(symbh.symoff + j * sizeof(nlist_t)); read_raw(fs, symbol); if (!symbol.n_strx) { continue; // Symbol has no name } if ((symbol.n_type & 0x0e) != 0xe || !symbol.n_sect) { continue; // Symbol has no section } if (section_index && section_index != symbol.n_sect) { continue; // Not in the required section } fs.seekg(symbh.stroff + symbol.n_strx); std::getline(fs, symbol_name, '\0'); if (symbol_name.empty()) { continue; } if (symbol_name[0] == '_') { // Linker adds additional '_' symbol. Could not find official docs for that case. ret.push_back(symbol_name.c_str() + 1); } else { ret.push_back(symbol_name); } } } }; public: static std::vector sections(std::ifstream& fs) { std::vector ret; section_names_gather f = { ret }; command_finder(fs, SEGMENT_CMD_NUMBER, f); return ret; } private: static header_t header(std::ifstream& fs) { header_t h; fs.seekg(0); read_raw(fs, h); return h; } public: static std::vector symbols(std::ifstream& fs) { std::vector ret; symbol_names_gather f = { ret, 0 }; command_finder(fs, load_command_types::LC_SYMTAB_, f); return ret; } static std::vector symbols(std::ifstream& fs, const char* section_name) { // Not very optimal solution std::vector ret = sections(fs); std::vector::iterator it = std::find(ret.begin(), ret.end(), section_name); if (it == ret.end()) { // No section with such name ret.clear(); return ret; } // section indexes start from 1 symbol_names_gather f = { ret, static_cast(1 + (it - ret.begin())) }; ret.clear(); command_finder(fs, load_command_types::LC_SYMTAB_, f); return ret; } }; using macho_info32 = macho_info; using macho_info64 = macho_info; }}} // namespace boost::dll::detail #endif // BOOST_DLL_DETAIL_MACHO_INFO_HPP