/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│ │vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│ ╞══════════════════════════════════════════════════════════════════════════════╡ │ Copyright 2020 Justine Alexandra Roberts Tunney │ │ │ │ This program is free software; you can redistribute it and/or modify │ │ it under the terms of the GNU General Public License as published by │ │ the Free Software Foundation; version 2 of the License. │ │ │ │ This program is distributed in the hope that it will be useful, but │ │ WITHOUT ANY WARRANTY; without even the implied warranty of │ │ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU │ │ General Public License for more details. │ │ │ │ You should have received a copy of the GNU General Public License │ │ along with this program; if not, write to the Free Software │ │ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA │ │ 02110-1301 USA │ ╚─────────────────────────────────────────────────────────────────────────────*/ #include "libc/assert.h" #include "libc/bits/bits.h" #include "libc/conv/itoa.h" #include "libc/limits.h" #include "libc/log/check.h" #include "libc/macros.h" #include "libc/str/str.h" #include "tool/build/lib/demangle.h" #include "tool/build/lib/dis.h" #include "tool/build/lib/endian.h" #include "tool/build/lib/high.h" #include "tool/build/lib/modrm.h" static const char kRiz[2][4] = {"eiz", "riz"}; static const char kRip[2][4] = {"eip", "rip"}; static const char kSka[4][4] = {"", ",2", ",4", ",8"}; static const char kSeg[8][3] = {"es", "cs", "ss", "ds", "fs", "gs"}; static const char kCtl[8][4] = {"cr0", "wut", "cr2", "cr3", "cr4", "wut", "wut", "wut"}; static const char kBreg[2][2][8][5] = { {{"al", "cl", "dl", "bl", "ah", "ch", "dh", "bh"}, {"al", "cl", "dl", "bl", "spl", "bpl", "sil", "dil"}}, {{"wut", "wut", "wut", "wut", "wut", "wut", "wut", "wut"}, {"r8b", "r9b", "r10b", "r11b", "r12b", "r13b", "r14b", "r15b"}}, }; static const char kGreg[2][2][2][8][5] = { {{{"eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi"}, {"r8d", "r9d", "r10d", "r11d", "r12d", "r13d", "r14d", "r15d"}}, {{"rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi"}, {"r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"}}}, {{{"ax", "cx", "dx", "bx", "sp", "bp", "si", "di"}, {"r8w", "re9w", "r10w", "r11w", "r12w", "r13w", "r14w", "r15w"}}, {{"rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi"}, {"r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15"}}}, }; static int64_t RipRelative(struct Dis *d, int64_t i) { return d->addr + d->xedd->length + i; } static int64_t ZeroExtend(uint32_t rde, int64_t i) { switch (Mode(rde)) { case XED_MODE_REAL: return i & 0xffff; case XED_MODE_LEGACY: return i & 0xffffffff; default: return i; } } static int64_t Unrelative(uint32_t rde, int64_t i) { switch (Eamode(rde)) { case XED_MODE_REAL: return i & 0xffff; case XED_MODE_LEGACY: return i & 0xffffffff; default: return i; } } static int64_t GetSeg(struct Dis *d, uint32_t rde, unsigned char *s) { switch (Sego(rde) ? Sego(rde) : d->xedd->op.hint) { default: return Read64(s); case 1: return Read64(d->m->es); case 2: return Read64(d->m->cs); case 3: return Read64(d->m->ss); case 4: return Read64(d->m->ds); } } static const char *GetAddrReg(struct Dis *d, uint32_t rde, uint8_t x, uint8_t r) { return kGreg[Eamode(rde) == XED_MODE_REAL][Eamode(rde) == XED_MODE_LONG] [x & 1][r & 7]; } static char *DisRegister(char *p, const char *s) { p = HighStart(p, g_high.reg); *p++ = '%'; p = stpcpy(p, s); p = HighEnd(p); return p; } static char *DisComment(char *p, const char *s) { p = HighStart(p, g_high.comment); p = stpcpy(p, s); p = HighEnd(p); return p; } static char *DisRegisterByte(struct Dis *d, uint32_t rde, char *p, bool g, int r) { return DisRegister(p, kBreg[g][Rex(rde)][r]); } static char *DisRegisterWord(struct Dis *d, uint32_t rde, char *p, bool g, int r) { return DisRegister(p, kGreg[Osz(rde)][Rexw(rde)][g][r]); } static char *DisInt(char *p, int64_t x) { if (-15 <= x && x <= 15) { p += int64toarray_radix10(x, p); } else if (x == INT64_MIN) { p = stpcpy(p, "-0x"); p += uint64toarray_radix16(INT64_MIN, p); } else if (x < 0 && -x < 0xFFFFFFFF) { p = stpcpy(p, "-0x"); p += uint64toarray_radix16(-x, p); } else { p = stpcpy(p, "0x"); p += uint64toarray_radix16(x, p); } return p; } static char *DisSymImpl(struct Dis *d, char *p, int64_t x, long sym) { int64_t addend; const char *name; addend = x - d->syms.p[sym].addr; name = d->syms.stab + d->syms.p[sym].name; p = Demangle(p, name, DIS_MAX_SYMBOL_LENGTH); if (addend) { *p++ = '+'; p = DisInt(p, addend); } return p; } static char *DisSym(struct Dis *d, char *p, int64_t x1, int64_t x2, bool isrelative) { long sym; if ((sym = DisFindSym(d, x2)) != -1 && d->syms.p[sym].name && (d->syms.p[sym].isabs ^ isrelative)) { return DisSymImpl(d, p, x2, sym); } else if ((sym = DisFindSym(d, x1)) != -1 && d->syms.p[sym].name && (d->syms.p[sym].isabs ^ isrelative)) { return DisSymImpl(d, p, x1, sym); } else { return DisInt(p, x1); } } static char *DisSymLiteral(struct Dis *d, uint32_t rde, char *p, uint64_t addr, uint64_t ip) { *p++ = '$'; p = HighStart(p, g_high.literal); p = DisSym(d, p, addr, addr, false); p = HighEnd(p); return p; } static char *DisGvqp(struct Dis *d, uint32_t rde, char *p) { return DisRegisterWord(d, rde, p, Rexr(rde), ModrmReg(rde)); } static char *DisGdqp(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[0][Rexw(rde)][Rexr(rde)][ModrmReg(rde)]); } static char *DisGb(struct Dis *d, uint32_t rde, char *p) { return DisRegisterByte(d, rde, p, Rexr(rde), ModrmReg(rde)); } static char *DisSego(struct Dis *d, uint32_t rde, char *p) { int seg; seg = Sego(rde) ? Sego(rde) : d->xedd->op.hint; if (seg) { p = DisRegister(p, kSeg[seg - 1]); *p++ = ':'; } return p; } static bool IsRealModrmAbsolute(uint32_t rde) { return Eamode(rde) == XED_MODE_REAL && ModrmRm(rde) == 6 && !ModrmMod(rde); } static char *DisDisp(struct Dis *d, uint32_t rde, char *p) { bool rela; int64_t disp; if (ModrmMod(rde) == 0b01 || ModrmMod(rde) == 0b10 || IsRipRelative(rde) || IsRealModrmAbsolute(rde) || (Eamode(rde) != XED_MODE_REAL && ModrmMod(rde) == 0b00 && ModrmRm(rde) == 0b100 && SibBase(d->xedd) == 0b101)) { disp = d->xedd->op.disp; if (IsRipRelative(rde)) { if (Mode(rde) == XED_MODE_LONG) { disp = RipRelative(d, disp); rela = true; } else { disp = Unrelative(rde, disp); rela = false; } } else if (IsRealModrmAbsolute(rde)) { disp = Unrelative(rde, disp); rela = false; } else { rela = true; } p = DisSym(d, p, disp, disp, rela); } return p; } static char *DisBis(struct Dis *d, uint32_t rde, char *p) { const char *base, *index, *scale; base = index = scale = NULL; if (Eamode(rde) != XED_MODE_REAL) { if (!SibExists(rde)) { DCHECK(!d->xedd->op.has_sib); if (IsRipRelative(rde)) { if (Mode(rde) == XED_MODE_LONG) { base = kRip[Eamode(rde) == XED_MODE_LONG]; } } else { base = GetAddrReg(d, rde, Rexb(rde), ModrmRm(rde)); } } else if (!SibIsAbsolute(d->xedd, rde)) { if (SibHasBase(d->xedd, rde)) { base = GetAddrReg(d, rde, Rexb(rde), SibBase(d->xedd)); } if (SibHasIndex(d->xedd)) { index = GetAddrReg(d, rde, Rexx(d->xedd), SibIndex(d->xedd)); } else if (d->xedd->op.scale) { index = kRiz[Eamode(rde) == XED_MODE_LONG]; } scale = kSka[d->xedd->op.scale]; } } else { switch (ModrmRm(rde)) { case 0: base = "bx"; index = "si"; break; case 1: base = "bx"; index = "di"; break; case 2: base = "bp"; index = "si"; break; case 3: base = "bp"; index = "di"; break; case 4: base = "si"; break; case 5: base = "di"; break; case 6: if (ModrmMod(rde)) base = "bp"; break; case 7: base = "bx"; break; default: unreachable; } } if (base || index) { *p++ = '('; if (base) { p = DisRegister(p, base); } if (index) { *p++ = ','; p = DisRegister(p, index); if (scale) { p = stpcpy(p, scale); } } *p++ = ')'; } *p = '\0'; return p; } static char *DisM(struct Dis *d, uint32_t rde, char *p) { p = DisSego(d, rde, p); p = DisDisp(d, rde, p); p = DisBis(d, rde, p); return p; } static char *DisRegMem(struct Dis *d, uint32_t rde, char *p, char *f(struct Dis *, uint32_t, char *)) { if (IsModrmRegister(rde)) { return f(d, rde, p); } else { return DisM(d, rde, p); } } static noinline char *DisE(struct Dis *d, uint32_t rde, char *p, char *f(struct Dis *, uint32_t, char *, bool, int)) { if (IsModrmRegister(rde)) { return f(d, rde, p, Rexb(rde), ModrmRm(rde)); } else { return DisM(d, rde, p); } } static char *DisEb(struct Dis *d, uint32_t rde, char *p) { return DisE(d, rde, p, DisRegisterByte); } static char *DisEvqp(struct Dis *d, uint32_t rde, char *p) { return DisE(d, rde, p, DisRegisterWord); } static char *DisEdqpReg(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[0][Rexw(rde)][Rexb(rde)][ModrmRm(rde)]); } static char *DisEdqp(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisEdqpReg); } static char *DisEvReg(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[Osz(rde)][0][Rexb(rde)][ModrmRm(rde)]); } static char *DisEv(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisEvReg); } static char *DisGvq(struct Dis *d, uint32_t rde, char *p, int r) { const char *s; if (Mode(rde) == XED_MODE_LONG) { s = kGreg[Osz(rde)][!Osz(rde)][Rexb(rde)][r]; } else { s = kGreg[Osz(rde)][0][Rexb(rde)][r]; } return DisRegister(p, s); } static char *DisZvq(struct Dis *d, uint32_t rde, char *p) { return DisGvq(d, rde, p, ModrmSrm(rde)); } static char *DisEvqReg(struct Dis *d, uint32_t rde, char *p) { return DisGvq(d, rde, p, ModrmRm(rde)); } static char *DisEvq(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisEvqReg); } static char *DisEdReg(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[0][0][Rexb(rde)][ModrmRm(rde)]); } static char *DisEd(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisEdReg); } static char *DisEqReg(struct Dis *d, uint32_t rde, char *p) { const char *r; if (Mode(rde) == XED_MODE_LONG) { r = kGreg[0][1][Rexb(rde)][ModrmRm(rde)]; } else { r = kGreg[Osz(rde)][0][Rexb(rde)][ModrmRm(rde)]; } return DisRegister(p, r); } static char *DisEq(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisEqReg); } static char *DisZvqp(struct Dis *d, uint32_t rde, char *p) { return DisRegisterWord(d, rde, p, Rexb(rde), ModrmSrm(rde)); } static char *DisZb(struct Dis *d, uint32_t rde, char *p) { return DisRegisterByte(d, rde, p, Rexb(rde), ModrmSrm(rde)); } static char *DisEax(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[Osz(rde)][0][0][0]); } static char *DisRax(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[Osz(rde)][Rexw(rde)][0][0]); } static char *DisRdx(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[Osz(rde)][Rexw(rde)][0][2]); } static char *DisCd(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kCtl[ModrmReg(rde)]); } static char *DisHd(struct Dis *d, uint32_t rde, char *p) { return DisRegister(p, kGreg[0][Mode(rde) == XED_MODE_LONG][0][ModrmRm(rde)]); } static char *DisImm(struct Dis *d, uint32_t rde, char *p) { return DisSymLiteral(d, rde, p, d->xedd->op.uimm0, ZeroExtend(rde, d->xedd->op.uimm0)); } static char *DisRvds(struct Dis *d, uint32_t rde, char *p) { return DisSymLiteral(d, rde, p, d->xedd->op.disp, d->xedd->op.disp); } static char *DisKpvds(struct Dis *d, uint32_t rde, char *p, uint64_t x) { *p++ = '$'; p = HighStart(p, g_high.literal); p = DisInt(p, x); p = HighEnd(p); return p; } static char *DisKvds(struct Dis *d, uint32_t rde, char *p) { return DisKpvds(d, rde, p, d->xedd->op.uimm0); } static char *DisPvds(struct Dis *d, uint32_t rde, char *p) { return DisKpvds(d, rde, p, d->xedd->op.disp & (Osz(rde) ? 0xffff : 0xffffffff)); } static char *DisOne(struct Dis *d, uint32_t rde, char *p) { *p++ = '$'; p = HighStart(p, g_high.literal); p = stpcpy(p, "1"); p = HighEnd(p); return p; } static char *DisJbs(struct Dis *d, uint32_t rde, char *p) { if (d->xedd->op.disp > 0) *p++ = '+'; p += int64toarray_radix10(d->xedd->op.disp, p); return p; } static char *DisJb(struct Dis *d, uint32_t rde, char *p) { if (d->xedd->op.disp > 0) *p++ = '+'; p += uint64toarray_radix10(d->xedd->op.disp & 0xff, p); return p; } static char *DisJvds(struct Dis *d, uint32_t rde, char *p) { return DisSym(d, p, RipRelative(d, d->xedd->op.disp), RipRelative(d, d->xedd->op.disp) - Read64(d->m->cs), true); } static char *DisAbs(struct Dis *d, uint32_t rde, char *p) { return DisSym(d, p, d->xedd->op.disp, d->xedd->op.disp, false); } static char *DisSw(struct Dis *d, uint32_t rde, char *p) { if (kSeg[ModrmReg(rde)][0]) p = DisRegister(p, kSeg[ModrmReg(rde)]); return p; } static char *DisSpecialAddr(struct Dis *d, uint32_t rde, char *p, int r) { *p++ = '('; p = DisRegister(p, GetAddrReg(d, rde, 0, r)); *p++ = ')'; *p = '\0'; return p; } static char *DisY(struct Dis *d, uint32_t rde, char *p) { return DisSpecialAddr(d, rde, p, 7); // es:di } static char *DisX(struct Dis *d, uint32_t rde, char *p) { p = DisSego(d, rde, p); return DisSpecialAddr(d, rde, p, 6); // ds:si } static char *DisBBb(struct Dis *d, uint32_t rde, char *p) { p = DisSego(d, rde, p); return DisSpecialAddr(d, rde, p, 3); // ds:bx } static char *DisXmm(struct Dis *d, uint32_t rde, char *p, const char *s, int reg) { p = HighStart(p, g_high.reg); *p++ = '%'; p = stpcpy(p, s); p += uint64toarray_radix10(reg, p); p = HighEnd(p); return p; } static char *DisNq(struct Dis *d, uint32_t rde, char *p) { return DisXmm(d, rde, p, "mm", ModrmRm(rde)); } static char *DisPq(struct Dis *d, uint32_t rde, char *p) { return DisXmm(d, rde, p, "mm", ModrmReg(rde)); } static char *DisUq(struct Dis *d, uint32_t rde, char *p) { return DisXmm(d, rde, p, "xmm", RexbRm(rde)); } static char *DisUdq(struct Dis *d, uint32_t rde, char *p) { return DisXmm(d, rde, p, "xmm", RexbRm(rde)); } static char *DisVdq(struct Dis *d, uint32_t rde, char *p) { return DisXmm(d, rde, p, "xmm", RexrReg(rde)); } static char *DisQq(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisNq); } static char *DisEst(struct Dis *d, uint32_t rde, char *p) { p = DisRegister(p, "st"); if (ModrmRm(rde) != 0) { *p++ = '('; *p++ = '0' + ModrmRm(rde); *p++ = ')'; *p = '\0'; } return p; } static char *DisEst1(struct Dis *d, uint32_t rde, char *p) { if (ModrmRm(rde) != 1) { p = DisEst(d, rde, p); } else { *p = '\0'; } return p; } static char *DisEssr(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisEst); } static char *DisWps(struct Dis *d, uint32_t rde, char *p) { return DisRegMem(d, rde, p, DisUdq); } #define DisEdr DisM #define DisEqp DisEq #define DisEsr DisM #define DisGv DisGvqp #define DisIb DisImm #define DisIbs DisImm #define DisIbss DisImm #define DisIvds DisImm #define DisIvqp DisImm #define DisIvs DisImm #define DisIw DisImm #define DisMdi DisM #define DisMdq DisM #define DisMdqp DisM #define DisMdr DisM #define DisMe DisM #define DisMer DisM #define DisMp DisM #define DisMps DisM #define DisMq DisM #define DisMqi DisM #define DisMs DisM #define DisMsr DisEssr #define DisMw DisM #define DisMwi DisM #define DisOb DisAbs #define DisOvqp DisAbs #define DisPpi DisPq #define DisQpi DisQq #define DisRdqp DisGdqp #define DisRvqp DisGvqp #define DisVpd DisVdq #define DisVps DisVdq #define DisVq DisVdq #define DisVsd DisVdq #define DisVss DisVdq #define DisWdq DisWps #define DisWpd DisWps #define DisWpsq DisWps #define DisWq DisWps #define DisWsd DisWps #define DisWss DisWps #define DisXb DisX #define DisXv DisX #define DisXvqp DisX #define DisYb DisY #define DisYv DisY #define DisYvqp DisY #define DisZv DisZvqp static const struct DisArg { char s[8]; char *(*f)(struct Dis *, uint32_t, char *); } kDisArgs[] = /* */ { {"$1", DisOne}, // {"%Cd", DisCd}, // {"%Gb", DisGb}, // {"%Gdqp", DisGdqp}, // {"%Gv", DisGv}, // {"%Gvqp", DisGvqp}, // {"%Hd", DisHd}, // {"%Nq", DisNq}, // {"%Ppi", DisPpi}, // {"%Pq", DisPq}, // {"%Rdqp", DisRdqp}, // {"%Rvqp", DisRvqp}, // {"%Sw", DisSw}, // {"%Udq", DisUdq}, // {"%Uq", DisUq}, // {"%Vdq", DisVdq}, // {"%Vpd", DisVpd}, // {"%Vps", DisVps}, // {"%Vq", DisVq}, // {"%Vsd", DisVsd}, // {"%Vss", DisVss}, // {"%Zb", DisZb}, // {"%Zv", DisZv}, // {"%Zvq", DisZvq}, // {"%Zvqp", DisZvqp}, // {"%eAX", DisEax}, // {"%rAX", DisRax}, // {"%rDX", DisRdx}, // {"BBb", DisBBb}, // {"EST", DisEst}, // {"EST1", DisEst1}, // {"ESsr", DisEssr}, // {"Eb", DisEb}, // {"Ed", DisEd}, // {"Edqp", DisEdqp}, // {"Edr", DisEdr}, // {"Eq", DisEq}, // {"Eqp", DisEqp}, // {"Esr", DisEsr}, // {"Ev", DisEv}, // {"Evq", DisEvq}, // {"Evqp", DisEvqp}, // {"Ew", DisEvqp}, // {"Ib", DisIb}, // {"Ibs", DisIbs}, // {"Ibss", DisIbss}, // {"Ivds", DisIvds}, // {"Ivqp", DisIvqp}, // {"Ivs", DisIvs}, // {"Iw", DisIw}, // {"Jb", DisJb}, // {"Jbs", DisJbs}, // {"Jvds", DisJvds}, // {"Kvds", DisKvds}, // {"M", DisM}, // {"Mdi", DisMdi}, // {"Mdq", DisMdq}, // {"Mdqp", DisMdqp}, // {"Mdr", DisMdr}, // {"Me", DisMe}, // {"Mer", DisMer}, // {"Mp", DisMp}, // {"Mps", DisMps}, // {"Mq", DisMq}, // {"Mqi", DisMqi}, // {"Ms", DisMs}, // {"Msr", DisMsr}, // {"Mw", DisMw}, // {"Mwi", DisMwi}, // {"Ob", DisOb}, // {"Ovqp", DisOvqp}, // {"Pvds", DisPvds}, // {"Qpi", DisQpi}, // {"Qq", DisQq}, // {"Rvds", DisRvds}, // {"Wdq", DisWdq}, // {"Wpd", DisWpd}, // {"Wps", DisWps}, // {"Wpsq", DisWpsq}, // {"Wq", DisWq}, // {"Wsd", DisWsd}, // {"Wss", DisWss}, // {"Xb", DisXb}, // {"Xv", DisXv}, // {"Xvqp", DisXvqp}, // {"Yb", DisYb}, // {"Yv", DisYv}, // {"Yvqp", DisYvqp}, // }; static int CompareString8(const char a[8], const char b[8]) { uint64_t x, y; x = READ64BE(a); y = READ64BE(b); return x > y ? 1 : x < y ? -1 : 0; } char *DisArg(struct Dis *d, char *p, const char *s) { char key[8]; int c, m, l, r; l = 0; r = ARRAYLEN(kDisArgs) - 1; strncpy(key, s, 8); while (l <= r) { m = (l + r) >> 1; c = CompareString8(kDisArgs[m].s, key); if (c < 0) { l = m + 1; } else if (c > 0) { r = m - 1; } else { return kDisArgs[m].f(d, d->xedd->op.rde, p); } } if (*s == '%') { p = DisRegister(p, s + 1); } else { p = stpcpy(p, s); } return p; }