2020-08-25 11:23:25 +00:00
|
|
|
/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
|
|
|
|
│vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│
|
|
|
|
╞══════════════════════════════════════════════════════════════════════════════╡
|
|
|
|
│ Copyright 2020 Justine Alexandra Roberts Tunney │
|
|
|
|
│ │
|
|
|
|
│ This program is free software; you can redistribute it and/or modify │
|
|
|
|
│ it under the terms of the GNU General Public License as published by │
|
|
|
|
│ the Free Software Foundation; version 2 of the License. │
|
|
|
|
│ │
|
|
|
|
│ This program is distributed in the hope that it will be useful, but │
|
|
|
|
│ WITHOUT ANY WARRANTY; without even the implied warranty of │
|
|
|
|
│ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU │
|
|
|
|
│ General Public License for more details. │
|
|
|
|
│ │
|
|
|
|
│ You should have received a copy of the GNU General Public License │
|
|
|
|
│ along with this program; if not, write to the Free Software │
|
|
|
|
│ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA │
|
|
|
|
│ 02110-1301 USA │
|
|
|
|
╚─────────────────────────────────────────────────────────────────────────────*/
|
|
|
|
#include "libc/alg/alg.h"
|
|
|
|
#include "libc/elf/elf.h"
|
|
|
|
#include "libc/elf/struct/sym.h"
|
|
|
|
#include "libc/log/check.h"
|
2020-10-06 06:11:49 +00:00
|
|
|
#include "libc/log/log.h"
|
2020-09-07 04:39:00 +00:00
|
|
|
#include "libc/macros.h"
|
2020-10-27 10:39:46 +00:00
|
|
|
#include "libc/mem/mem.h"
|
2020-10-06 06:11:49 +00:00
|
|
|
#include "libc/str/str.h"
|
2020-08-25 11:23:25 +00:00
|
|
|
#include "tool/build/lib/dis.h"
|
|
|
|
|
2020-10-06 06:11:49 +00:00
|
|
|
/* When true, DisIsProg() returns true for every address without
   consulting the list of loaded segments. */
bool g_disisprog_disable;
|
|
|
|
|
2020-08-25 11:23:25 +00:00
|
|
|
static int DisSymCompare(const struct DisSym *a, const struct DisSym *b) {
|
|
|
|
if (a->addr != b->addr) {
|
|
|
|
if (a->addr < b->addr) return -1;
|
|
|
|
if (a->addr > b->addr) return +1;
|
|
|
|
}
|
|
|
|
if (a->rank != b->rank) {
|
|
|
|
if (a->rank > b->rank) return -1;
|
|
|
|
if (a->rank < b->rank) return +1;
|
|
|
|
}
|
|
|
|
if (a->unique != b->unique) {
|
|
|
|
if (a->unique < b->unique) return -1;
|
|
|
|
if (a->unique > b->unique) return +1;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void DisLoadElfLoads(struct Dis *d, struct Elf *elf) {
|
2020-10-27 10:39:46 +00:00
|
|
|
long i, j, n;
|
2020-08-25 11:23:25 +00:00
|
|
|
int64_t addr;
|
|
|
|
uint64_t size;
|
|
|
|
Elf64_Phdr *phdr;
|
2020-10-27 10:39:46 +00:00
|
|
|
j = 0;
|
|
|
|
n = elf->ehdr->e_phnum;
|
|
|
|
if (d->loads.n < n) {
|
|
|
|
d->loads.n = n;
|
|
|
|
d->loads.p = realloc(d->loads.p, d->loads.n * sizeof(*d->loads.p));
|
|
|
|
CHECK_NOTNULL(d->loads.p);
|
|
|
|
}
|
|
|
|
for (i = 0; i < n; ++i) {
|
2020-08-25 11:23:25 +00:00
|
|
|
phdr = getelfsegmentheaderaddress(elf->ehdr, elf->size, i);
|
|
|
|
if (phdr->p_type != PT_LOAD) continue;
|
2020-10-27 10:39:46 +00:00
|
|
|
d->loads.p[j].addr = phdr->p_vaddr;
|
|
|
|
d->loads.p[j].size = phdr->p_memsz;
|
|
|
|
d->loads.p[j].istext = (phdr->p_flags & PF_X) == PF_X;
|
|
|
|
++j;
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|
2020-10-27 10:39:46 +00:00
|
|
|
d->loads.i = j;
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static void DisLoadElfSyms(struct Dis *d, struct Elf *elf) {
|
2020-10-27 10:39:46 +00:00
|
|
|
size_t i, j, n;
|
2020-08-25 11:23:25 +00:00
|
|
|
int64_t stablen;
|
|
|
|
const Elf64_Sym *st, *sym;
|
|
|
|
bool isabs, iscode, isweak, islocal, ishidden, isprotected, isfunc, isobject;
|
2020-10-27 10:39:46 +00:00
|
|
|
j = 0;
|
2020-08-25 11:23:25 +00:00
|
|
|
if ((d->syms.stab = getelfstringtable(elf->ehdr, elf->size)) &&
|
|
|
|
(st = getelfsymboltable(elf->ehdr, elf->size, &n))) {
|
|
|
|
stablen = (intptr_t)elf->ehdr + elf->size - (intptr_t)d->syms.stab;
|
2020-10-27 10:39:46 +00:00
|
|
|
if (d->syms.n < n) {
|
|
|
|
d->syms.n = n;
|
|
|
|
d->syms.p = realloc(d->syms.p, d->syms.n * sizeof(*d->syms.p));
|
|
|
|
CHECK_NOTNULL(d->syms.p);
|
|
|
|
}
|
2020-08-25 11:23:25 +00:00
|
|
|
for (i = 0; i < n; ++i) {
|
2020-10-27 10:39:46 +00:00
|
|
|
if (ELF64_ST_TYPE(st[i].st_info) == STT_SECTION ||
|
|
|
|
ELF64_ST_TYPE(st[i].st_info) == STT_FILE || !st[i].st_name ||
|
|
|
|
startswith(d->syms.stab + st[i].st_name, "v_") ||
|
|
|
|
!(0 <= st[i].st_name && st[i].st_name < stablen) || !st[i].st_value ||
|
|
|
|
!(-0x800000000000 <= (int64_t)st[i].st_value &&
|
|
|
|
(int64_t)st[i].st_value < 0x800000000000)) {
|
|
|
|
continue;
|
|
|
|
}
|
2020-08-25 11:23:25 +00:00
|
|
|
isabs = st[i].st_shndx == SHN_ABS;
|
|
|
|
isweak = ELF64_ST_BIND(st[i].st_info) == STB_WEAK;
|
|
|
|
islocal = ELF64_ST_BIND(st[i].st_info) == STB_LOCAL;
|
|
|
|
ishidden = st[i].st_other == STV_HIDDEN;
|
|
|
|
isprotected = st[i].st_other == STV_PROTECTED;
|
|
|
|
isfunc = ELF64_ST_TYPE(st[i].st_info) == STT_FUNC;
|
|
|
|
isobject = ELF64_ST_TYPE(st[i].st_info) == STT_OBJECT;
|
2020-10-27 10:39:46 +00:00
|
|
|
d->syms.p[j].unique = i;
|
|
|
|
d->syms.p[j].size = st[i].st_size;
|
|
|
|
d->syms.p[j].name = st[i].st_name;
|
|
|
|
d->syms.p[j].addr = st[i].st_value;
|
|
|
|
d->syms.p[j].rank =
|
|
|
|
-islocal + -isweak + -isabs + isprotected + isobject + isfunc;
|
|
|
|
d->syms.p[j].iscode = DisIsText(d, st[i].st_value) ? !isobject : isfunc;
|
|
|
|
d->syms.p[j].isabs = isabs;
|
|
|
|
++j;
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|
|
|
|
}
|
2020-10-27 10:39:46 +00:00
|
|
|
d->syms.i = j;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void DisSortSyms(struct Dis *d) {
|
2020-08-25 11:23:25 +00:00
|
|
|
qsort(d->syms.p, d->syms.i, sizeof(struct DisSym), (void *)DisSymCompare);
|
|
|
|
}
|
|
|
|
|
2020-10-27 10:39:46 +00:00
|
|
|
static void DisCanonizeSyms(struct Dis *d) {
|
|
|
|
int64_t i, j, a;
|
|
|
|
if (d->syms.i) {
|
|
|
|
i = 1;
|
|
|
|
j = 1;
|
|
|
|
a = d->syms.p[0].addr;
|
|
|
|
do {
|
|
|
|
if (d->syms.p[j].addr > a) {
|
|
|
|
a = d->syms.p[j].addr;
|
|
|
|
if (j > i) {
|
|
|
|
d->syms.p[i] = d->syms.p[j];
|
|
|
|
}
|
|
|
|
++i;
|
|
|
|
}
|
|
|
|
++j;
|
|
|
|
} while (j < d->syms.i);
|
|
|
|
d->syms.p = realloc(d->syms.p, sizeof(*d->syms.p) * i);
|
|
|
|
d->syms.i = i;
|
|
|
|
d->syms.n = i;
|
|
|
|
}
|
|
|
|
for (i = 0; i < d->syms.i; ++i) {
|
|
|
|
DEBUGF("%p-%p %s", d->syms.p[i].addr,
|
|
|
|
d->syms.p[i].addr + (d->syms.p[i].size ? d->syms.p[i].size - 1 : 0),
|
|
|
|
d->syms.stab + d->syms.p[i].name);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-25 11:23:25 +00:00
|
|
|
bool DisIsProg(struct Dis *d, int64_t addr) {
|
|
|
|
long i;
|
2020-10-06 06:11:49 +00:00
|
|
|
if (g_disisprog_disable) return true;
|
2020-08-25 11:23:25 +00:00
|
|
|
for (i = 0; i < d->loads.i; ++i) {
|
|
|
|
if (addr >= d->loads.p[i].addr &&
|
|
|
|
addr < d->loads.p[i].addr + d->loads.p[i].size) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool DisIsText(struct Dis *d, int64_t addr) {
|
|
|
|
long i;
|
|
|
|
for (i = 0; i < d->loads.i; ++i) {
|
|
|
|
if (addr >= d->loads.p[i].addr &&
|
|
|
|
addr < d->loads.p[i].addr + d->loads.p[i].size) {
|
|
|
|
return d->loads.p[i].istext;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
long DisFindSym(struct Dis *d, int64_t addr) {
|
2020-10-27 10:39:46 +00:00
|
|
|
long l, r, m, n;
|
|
|
|
if (DisIsProg(d, addr)) {
|
|
|
|
l = 0;
|
|
|
|
r = d->syms.i;
|
|
|
|
while (l < r) {
|
|
|
|
m = (l + r) >> 1;
|
|
|
|
if (d->syms.p[m].addr > addr) {
|
|
|
|
r = m;
|
|
|
|
} else {
|
|
|
|
l = m + 1;
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|
|
|
|
}
|
2020-10-27 10:39:46 +00:00
|
|
|
if (r && (addr == d->syms.p[r - 1].addr ||
|
|
|
|
(addr > d->syms.p[r - 1].addr &&
|
|
|
|
(addr <= d->syms.p[r - 1].addr + d->syms.p[r - 1].size ||
|
|
|
|
!d->syms.p[r - 1].size)))) {
|
|
|
|
return r - 1;
|
|
|
|
}
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
long DisFindSymByName(struct Dis *d, const char *s) {
|
|
|
|
long i;
|
|
|
|
for (i = 0; i < d->syms.i; ++i) {
|
|
|
|
if (strcmp(s, d->syms.stab + d->syms.p[i].name) == 0) {
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
void DisLoadElf(struct Dis *d, struct Elf *elf) {
|
|
|
|
if (!elf || !elf->ehdr) return;
|
|
|
|
DisLoadElfLoads(d, elf);
|
|
|
|
DisLoadElfSyms(d, elf);
|
2020-10-27 10:39:46 +00:00
|
|
|
DisSortSyms(d);
|
|
|
|
DisCanonizeSyms(d);
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|