Question

我正在开发一个使用内存映射nm实现基本mmap的项目。我已经能够使用代码解析64位二进制文件：

void        handle_64(char *ptr)
{
    int                     ncmds;
    struct mach_header_64   *header;
    struct load_command     *lc;
    struct symtab_command   *sym;
    int                     i;

    i = 0;
    header = (struct mach_header_64 *)ptr;
    ncmds = header->ncmds;
    lc = (void *)ptr + sizeof(*header);
    while (i < ncmds)
    {
        if (lc->cmd == LC_SYMTAB)
        {
            sym = (struct symtab_command *)lc;
            build_list (sym->nsyms, sym->symoff, sym->stroff, ptr);
            break;
         }
         lc = (void *) lc + lc->cmdsize;
         i++;
    }
}

根据这个link，mach-o和fat二进制文件之间的唯一区别是它上面的fat_header结构，但只是跳过

lc = (void *)ptr + sizeof(struct fat_header) + sizeof(struct mach_header_64);

没有让我进入load_command区域（segfault）。如何访问fat / universal二进制文件的加载命令。

我正在使用运行macOS High Sierra的64位Mac。谢谢。

Answer 1

您遇到了多个问题：

你链接到哪个博客的电话＆＃34;胖标题＆＃34;不仅仅是struct fat_header。
无法确保Mach-O标头在胖标头之后立即跟随，只需某处之后（通常Mach-O段要对齐到整个页面，所以在胖标题之后立即放置它们甚至可能不起作用。）

无处可以保证64位切片将成为二进制中的第一个，也不会有一个。

考虑到所有这些，如果您希望获得有用的结果，需要来解析胖头（而不是忽略它）。

现在，fat_header的定义如下：

struct fat_header { uint32_t magic; /* FAT_MAGIC or FAT_MAGIC_64 */ uint32_t nfat_arch; /* number of structs that follow */ };

首先，我通常在胖二进制文件中看到的神奇值是FAT_CIGAM而不是FAT_MAGIC，尽管注释另有说明（但请注意 - 这意味着胖头中的整数是大端而不是小端！）。但其次，表明某些结构遵循这个标题，即：

struct fat_arch { cpu_type_t cputype; /* cpu specifier (int) */ cpu_subtype_t cpusubtype; /* machine specifier (int) */ uint32_t offset; /* file offset to this object file */ uint32_t size; /* size of this object file */ uint32_t align; /* alignment as a power of 2 */ };

这与＃＆＃34;瘦＆＃34;的工作原理相同。 Mach-O标头使用其加载命令。 fat_arch.offset是从文件开头的偏移量。接下来，打印所有切片的Mach-O非常简单：

#include <stdio.h> #include <mach-o/fat.h> #define SWAP32(x) ((((x) & 0xff000000) >> 24) | (((x) & 0xff0000) >> 8) | (((x) & 0xff00) << 8) | (((x) & 0xff) << 24)) void print_fat_header(void *buf) { struct fat_header *hdr = buf; if(hdr->magic != FAT_CIGAM) { fprintf(stderr, "bad magic: %08x\n", hdr->magic); return; } struct fat_arch *archs = (struct fat_arch*)(hdr + 1); uint32_t num = SWAP32(hdr->nfat_arch); for(size_t i = 0; i < num; ++i) { const char *name = "unknown"; switch(SWAP32(archs[i].cputype)) { case CPU_TYPE_I386: name = "i386"; break; case CPU_TYPE_X86_64: name = "x86_64"; break; case CPU_TYPE_ARM: name = "arm"; break; case CPU_TYPE_ARM64: name = "arm64"; break; } uint32_t off = SWAP32(archs[i].offset); uint32_t magic = *(uint32_t*)((uintptr_t)buf + off); printf("%08x-%08x: %-8s (magic %8x)\n", off, off + SWAP32(archs[i].size), name, magic); } }

请注意，上述函数不完整，因为它不知道buf的长度，因此不能也不会检查任何被访问的内存。在一个严肃的实现中，你应该确保永远不会读到你给出的缓冲区之外。您的代码发生错误的事实也暗示它没有做足够的数据清理。

解析通用/胖二进制文件

1 个答案: