經過dlopen、dlsym獲取共享庫函數地址、全局變量是一種常常使用到的編程技巧,尤爲是在Hook框架中。然而不管是dlsym仍是一些經常使用框架(如Nougat_dlfunctions),都只能搜索**.dynsym段,而沒法搜索.symtab**段。所以實現.symtab段搜索是一個亟待解決的問題。git
本文將介紹在Nougat_dlfunctions框架基礎上,如何實現搜索.symtab段的功能。(若是對FastHook不瞭解,請查閱FastHook——一種高效穩定、簡潔易用的Android Hook框架) 項目地址:Enhanced_dlfunctionsgithub
ELF文件實際是個表結構,以段爲單位,每一個段存儲不一樣的信息,段與段之間以索引來關聯造成一個表。因此只要有一個頭,就能夠經過這些關係訪問全部的段,這個頭即是ELF文件頭。下面咱們來看看須要獲取那些信息:編程
void *enhanced_dlopen(const char *libpath, int flags) {
FILE *maps;
char buff[256];
struct ctx *ctx = 0;
off_t load_addr, size;
int k, fd = -1, found = 0;
void *shoff;
Elf_Ehdr *elf = (Elf_Ehdr *) MAP_FAILED;
#define fatal(fmt, args...) do { log_err(fmt,##args); goto err_exit; } while(0)
maps = fopen("/proc/self/maps", "r");
if (!maps) fatal("failed to open maps");
while (!found && fgets(buff, sizeof(buff), maps))
if (strstr(buff, "r-xp") && strstr(buff, libpath)) found = 1;
fclose(maps);
if (!found) fatal("%s not found in my userspace", libpath);
if (sscanf(buff, "%lx", &load_addr) != 1)
fatal("failed to read load address for %s", libpath);
log_info("%s loaded in Android at 0x%08lx", libpath, load_addr);
/* Now, mmap the same library once again */
fd = open(libpath, O_RDONLY);
if (fd < 0) fatal("failed to open %s", libpath);
size = lseek(fd, 0, SEEK_END);
if (size <= 0) fatal("lseek() failed for %s", libpath);
elf = (Elf_Ehdr *) mmap(0, size, PROT_READ, MAP_SHARED, fd, 0);
close(fd);
fd = -1;
if (elf == MAP_FAILED) fatal("mmap() failed for %s", libpath);
ctx = (struct ctx *) calloc(1, sizeof(struct ctx));
if (!ctx) fatal("no memory for %s", libpath);
ctx->load_addr = (void *) load_addr;
shoff = ((void *) elf) + elf->e_shoff;
Elf_Shdr *shstrtab = (Elf_Shdr *)(shoff + elf->e_shstrndx * elf->e_shentsize);
char * shstr = malloc(shstrtab->sh_size);
memcpy(shstr, ((void *) elf) + shstrtab->sh_offset, shstrtab->sh_size);
for (k = 0; k < elf->e_shnum; k++, shoff += elf->e_shentsize) {
Elf_Shdr *sh = (Elf_Shdr *) shoff;
log_dbg("%s: k=%d shdr=%p type=%d", __func__, k, sh, sh->sh_type);
switch (sh->sh_type) {
case SHT_DYNSYM:
if (ctx->dynsym) fatal("%s: duplicate DYNSYM sections", libpath); /* .dynsym */
ctx->dynsym = malloc(sh->sh_size);
if (!ctx->dynsym) fatal("%s: no memory for .dynsym", libpath);
memcpy(ctx->dynsym, ((void *) elf) + sh->sh_offset, sh->sh_size);
ctx->dynsym_num = (sh->sh_size / sizeof(Elf_Sym));
break;
case SHT_SYMTAB:
if (ctx->symtab) fatal("%s: duplicate SYMTAB sections", libpath); /* .symtab */
ctx->symtab = malloc(sh->sh_size);
if (!ctx->symtab) fatal("%s: no memory for .symtab", libpath);
memcpy(ctx->symtab, ((void *) elf) + sh->sh_offset, sh->sh_size);
ctx->symtab_num = (sh->sh_size / sizeof(Elf_Sym));
break;
case SHT_STRTAB:
if(!strcmp(shstr+sh->sh_name,".dynstr")) {
if (ctx->dynstr) break; /* .dynstr is guaranteed to be the first STRTAB */
ctx->dynstr = malloc(sh->sh_size);
if (!ctx->dynstr) fatal("%s: no memory for .dynstr", libpath);
memcpy(ctx->dynstr, ((void *) elf) + sh->sh_offset, sh->sh_size);
}else if(!strcmp(shstr+sh->sh_name,".strtab")) {
if (ctx->strtab) break;
ctx->strtab = malloc(sh->sh_size);
if (!ctx->strtab) fatal("%s: no memory for .strtab", libpath);
memcpy(ctx->strtab, ((void *) elf) + sh->sh_offset, sh->sh_size);
}
break;
case SHT_PROGBITS:
if (!ctx->dynstr || !ctx->dynsym || ctx->bias) break;
/* won't even bother checking against the section name */ ctx->bias = (off_t) sh->sh_addr - (off_t) sh->sh_offset; break; } } munmap(elf, size); elf = 0; if (!ctx->dynstr || !ctx->dynsym) fatal("dynamic sections not found in %s", libpath); #undef fatal log_dbg("%s: ok, dynsym = %p, dynstr = %p symtab = %p strtab = %p", libpath, ctx->dynsym, ctx->dynstr, ctx->symtab, ctx->strtab); return ctx; } 複製代碼
1. 獲取so加載的地址,存儲在load_addrbash
maps = fopen("/proc/self/maps", "r");
while (!found && fgets(buff, sizeof(buff), maps))
if (strstr(buff, "r-xp") && strstr(buff, libpath)) found = 1;
fclose(maps);
if (sscanf(buff, "%lx", &load_addr) != 1)
fatal("failed to read load address for %s", libpath);
複製代碼
2. 從新映射so,獲取ELF文件頭微信
fd = open(libpath, O_RDONLY);
size = lseek(fd, 0, SEEK_END);
elf = (Elf_Ehdr *) mmap(0, size, PROT_READ, MAP_SHARED, fd, 0);
複製代碼
3. 獲取.shstrtab段。框架
Elf_Shdr *shstrtab = (Elf_Shdr *)(shoff + elf->e_shstrndx * elf->e_shentsize);
char * shstr = malloc(shstrtab->sh_size);
memcpy(shstr, ((void *) elf) + shstrtab->sh_offset, shstrtab->sh_size);
複製代碼
4.獲取.dynsym段、.dynstr段、.symtab段、.strtab段函數
for (k = 0; k < elf->e_shnum; k++, shoff += elf->e_shentsize) {
Elf_Shdr *sh = (Elf_Shdr *) shoff;
switch (sh->sh_type) {
case SHT_DYNSYM:
ctx->dynsym = malloc(sh->sh_size);
memcpy(ctx->dynsym, ((void *) elf) + sh->sh_offset, sh->sh_size);
ctx->dynsym_num = (sh->sh_size / sizeof(Elf_Sym));
break;
case SHT_SYMTAB:
ctx->symtab = malloc(sh->sh_size);
memcpy(ctx->symtab, ((void *) elf) + sh->sh_offset, sh->sh_size);
ctx->symtab_num = (sh->sh_size / sizeof(Elf_Sym));
break;
case SHT_STRTAB:
if(!strcmp(shstr+sh->sh_name,".dynstr")) {
ctx->dynstr = malloc(sh->sh_size);
memcpy(ctx->dynstr, ((void *) elf) + sh->sh_offset, sh->sh_size);
}else if(!strcmp(shstr+sh->sh_name,".strtab")) {
ctx->strtab = malloc(sh->sh_size);
memcpy(ctx->strtab, ((void *) elf) + sh->sh_offset, sh->sh_size);
}
break;
case SHT_PROGBITS:
if (!ctx->dynstr || !ctx->dynsym || ctx->bias) break;
ctx->bias = (off_t) sh->sh_addr - (off_t) sh->sh_offset;
break;
}
}
複製代碼
void *enhanced_dlsym(void *handle, const char *name) {
int k;
struct ctx *ctx = (struct ctx *) handle;
Elf_Sym *dynsym = (Elf_Sym *) ctx->dynsym;
Elf_Sym *symtab = (Elf_Sym *) ctx->symtab;
char *dynstr = (char *) ctx->dynstr;
char *strtab = (char *) ctx->strtab;
for (k = 0; k < ctx->dynsym_num; k++, dynsym++) {
if (strcmp(dynstr + dynsym->st_name, name) == 0) {
void *ret = ctx->load_addr + dynsym->st_value - ctx->bias;
log_info("%s found at %p", name, ret);
return ret;
}
}
if(symtab) {
for (k = 0; k < ctx->symtab_num; k++, symtab++) {
sym_tab->st_name,strings + sym_tab->st_name,k);
if (strcmp(strtab + symtab->st_name, name) == 0) {
void *ret = ctx->load_addr + symtab->st_value - ctx->bias;
log_info("%s found at %p", name, ret);
return ret;
}
}
}
return 0;
}
複製代碼
1. 先查詢.dynsym段。遍歷.dymsym全部符號,查找符號名與給定字符串一致的符號。用load_addr、bias結合符號偏移來獲取實際地址。post
for (k = 0; k < ctx->dynsym_num; k++, dynsym++) {
if (strcmp(dynstr + dynsym->st_name, name) == 0) {
void *ret = ctx->load_addr + dynsym->st_value - ctx->bias;
log_info("%s found at %p", name, ret);
return ret;
}
}
複製代碼
2. 若是.dynsym段找不到目標符號且.symtab段存在時,遍歷.symtab全部符號,查找符號名與給定字符串一致的符號。用load_addr、bias結合符號偏移來獲取實際地址。ui
for (k = 0; k < ctx->symtab_num; k++, symtab++) {
sym_tab->st_name,strings + sym_tab->st_name,k);
if (strcmp(strtab + symtab->st_name, name) == 0) {
void *ret = ctx->load_addr + symtab->st_value - ctx->bias;
log_info("%s found at %p", name, ret);
return ret;
}
}
複製代碼
Nougat_dlfunctions只支持arm平臺,而我在實際工做中也不涉及到x86平臺,因此Enhanced dlfunctions暫時只支持arm32和arm64,若是要兼容x86等其餘平臺也不難,不須要改實現,主要就是elf.h一些結構體的不一樣。spa