2020-08-25 11:23:25 +00:00
|
|
|
/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
|
|
|
|
│vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│
|
|
|
|
╞══════════════════════════════════════════════════════════════════════════════╡
|
|
|
|
│ Copyright 2020 Justine Alexandra Roberts Tunney │
|
|
|
|
│ │
|
|
|
|
│ This program is free software; you can redistribute it and/or modify │
|
|
|
|
│ it under the terms of the GNU General Public License as published by │
|
|
|
|
│ the Free Software Foundation; version 2 of the License. │
|
|
|
|
│ │
|
|
|
|
│ This program is distributed in the hope that it will be useful, but │
|
|
|
|
│ WITHOUT ANY WARRANTY; without even the implied warranty of │
|
|
|
|
│ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU │
|
|
|
|
│ General Public License for more details. │
|
|
|
|
│ │
|
|
|
|
│ You should have received a copy of the GNU General Public License │
|
|
|
|
│ along with this program; if not, write to the Free Software │
|
|
|
|
│ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA │
|
|
|
|
│ 02110-1301 USA │
|
|
|
|
╚─────────────────────────────────────────────────────────────────────────────*/
|
|
|
|
#include "libc/log/check.h"
|
|
|
|
#include "libc/nexgen32e/tinystrcmp.h"
|
|
|
|
#include "libc/str/str.h"
|
2020-10-06 06:11:49 +00:00
|
|
|
#include "third_party/zlib/zlib.h"
|
2020-08-25 11:23:25 +00:00
|
|
|
#include "tool/build/lib/dis.h"
|
2020-09-28 08:13:56 +00:00
|
|
|
#include "tool/build/lib/high.h"
|
2020-08-25 11:23:25 +00:00
|
|
|
#include "tool/build/lib/modrm.h"
|
|
|
|
|
2020-09-07 04:39:00 +00:00
|
|
|
static const char kJcxz[3][6] = {"jcxz", "jecxz", "jrcxz"};
|
2020-08-25 11:23:25 +00:00
|
|
|
static const char kAluOp[8][4] = {"add", "or", "adc", "sbb",
|
|
|
|
"and", "sub", "xor", "cmp"};
|
|
|
|
static const char kBitOp[8][4] = {"rol", "ror", "rcl", "rcr",
|
|
|
|
"shl", "shr", "sal", "sar"};
|
2020-09-28 08:13:56 +00:00
|
|
|
static const char kCc[16][3] = {"o", "no", "b", "ae", "e", "ne", "be", "a",
|
|
|
|
"s", "ns", "p", "np", "l", "ge", "le", "g"};
|
2020-08-25 11:23:25 +00:00
|
|
|
|
2020-08-27 06:08:08 +00:00
|
|
|
static bool IsProbablyByteOp(struct XedDecodedInst *x) {
|
|
|
|
return !(x->op.opcode & 1);
|
|
|
|
}
|
|
|
|
|
2020-09-28 08:13:56 +00:00
|
|
|
static int IsRepOpcode(struct Dis *d) {
|
|
|
|
switch (d->xedd->op.opcode & ~1) {
|
|
|
|
case 0x6C: // INS
|
2020-08-27 06:08:08 +00:00
|
|
|
return 1;
|
2020-09-28 08:13:56 +00:00
|
|
|
case 0x6E: // OUTS
|
2020-08-27 06:08:08 +00:00
|
|
|
return 1;
|
2020-09-28 08:13:56 +00:00
|
|
|
case 0xA4: // MOVS
|
2020-08-27 06:08:08 +00:00
|
|
|
return 1;
|
2020-09-28 08:13:56 +00:00
|
|
|
case 0xAA: // STOS
|
2020-08-27 06:08:08 +00:00
|
|
|
return 1;
|
2020-09-28 08:13:56 +00:00
|
|
|
case 0xAC: // LODS
|
2020-08-27 06:08:08 +00:00
|
|
|
return 1;
|
2020-09-28 08:13:56 +00:00
|
|
|
case 0xA6: // CMPS
|
2020-08-27 06:08:08 +00:00
|
|
|
return 2;
|
2020-09-28 08:13:56 +00:00
|
|
|
case 0xAE: // SCAS
|
2020-08-27 06:08:08 +00:00
|
|
|
return 2;
|
2020-08-25 11:23:25 +00:00
|
|
|
default:
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-09-28 08:13:56 +00:00
|
|
|
static char *DisRepPrefix(struct Dis *d, char *p) {
|
2020-08-25 11:23:25 +00:00
|
|
|
const char *s;
|
2020-09-28 08:13:56 +00:00
|
|
|
if (Rep(d->xedd->op.rde) && d->xedd->op.map == XED_ILD_MAP0) {
|
|
|
|
switch (IsRepOpcode(d)) {
|
2020-08-25 11:23:25 +00:00
|
|
|
case 0:
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
p = stpcpy(p, "rep ");
|
|
|
|
break;
|
|
|
|
case 2:
|
2020-09-28 08:13:56 +00:00
|
|
|
p = stpcpy(p, Rep(d->xedd->op.rde) == 2 ? "repnz " : "repz ");
|
2020-08-25 11:23:25 +00:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
2020-09-28 08:13:56 +00:00
|
|
|
static char *DisBranchTaken(struct Dis *d, char *p) {
|
|
|
|
switch (d->xedd->op.hint) {
|
2020-08-25 11:23:25 +00:00
|
|
|
case XED_HINT_NTAKEN:
|
|
|
|
return stpcpy(p, ",pn");
|
|
|
|
case XED_HINT_TAKEN:
|
|
|
|
return stpcpy(p, ",pt");
|
|
|
|
default:
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-09-28 08:13:56 +00:00
|
|
|
static char *DisName(struct Dis *d, char *bp, const char *name,
|
2020-08-25 11:23:25 +00:00
|
|
|
bool ambiguous) {
|
|
|
|
char *p, *np;
|
2020-09-07 04:39:00 +00:00
|
|
|
uint32_t rde;
|
2020-08-25 11:23:25 +00:00
|
|
|
bool notbyte, notlong, wantsuffix, wantsuffixsd;
|
|
|
|
p = bp;
|
2020-09-28 08:13:56 +00:00
|
|
|
rde = d->xedd->op.rde;
|
|
|
|
if (d->xedd->op.lock) p = stpcpy(p, "lock ");
|
|
|
|
p = DisRepPrefix(d, p);
|
2020-08-25 11:23:25 +00:00
|
|
|
if (tinystrcmp(name, "BIT") == 0) {
|
2020-09-07 04:39:00 +00:00
|
|
|
p = stpcpy(p, kBitOp[ModrmReg(rde)]);
|
2020-09-28 08:13:56 +00:00
|
|
|
} else if (tinystrcmp(name, "nop") == 0 && d->xedd->op.rep) {
|
|
|
|
p = stpcpy(p, "pause");
|
2020-08-25 11:23:25 +00:00
|
|
|
} else if (tinystrcmp(name, "CALL") == 0) {
|
|
|
|
p = stpcpy(p, "call");
|
|
|
|
} else if (tinystrcmp(name, "JMP") == 0) {
|
|
|
|
p = stpcpy(p, "jmp");
|
|
|
|
} else if (tinystrcmp(name, "jcxz") == 0) {
|
2020-09-07 04:39:00 +00:00
|
|
|
p = stpcpy(p, kJcxz[Eamode(rde)]);
|
2020-09-28 08:13:56 +00:00
|
|
|
p = DisBranchTaken(d, p);
|
2020-09-07 04:39:00 +00:00
|
|
|
} else if (tinystrcmp(name, "loop") == 0 || tinystrcmp(name, "loope") == 0 ||
|
|
|
|
tinystrcmp(name, "loopne") == 0) {
|
|
|
|
p = stpcpy(p, name);
|
|
|
|
if (Eamode(rde) != Mode(rde)) {
|
|
|
|
*p++ = "wl"[Eamode(rde)];
|
|
|
|
*p = '\0';
|
|
|
|
}
|
2020-09-28 08:13:56 +00:00
|
|
|
p = DisBranchTaken(d, p);
|
2020-08-25 11:23:25 +00:00
|
|
|
} else if (tinystrcmp(name, "cwtl") == 0) {
|
2020-09-07 04:39:00 +00:00
|
|
|
if (Osz(rde)) name = "cbtw";
|
|
|
|
if (Rexw(rde)) name = "cltq";
|
2020-08-25 11:23:25 +00:00
|
|
|
p = stpcpy(p, name);
|
|
|
|
} else if (tinystrcmp(name, "cltd") == 0) {
|
2020-09-07 04:39:00 +00:00
|
|
|
if (Osz(rde)) name = "cwtd";
|
|
|
|
if (Rexw(rde)) name = "cqto";
|
2020-08-25 11:23:25 +00:00
|
|
|
p = stpcpy(p, name);
|
|
|
|
} else {
|
|
|
|
notbyte = false;
|
|
|
|
notlong = false;
|
|
|
|
wantsuffix = false;
|
|
|
|
wantsuffixsd = false;
|
|
|
|
for (np = name; *np && (islower(*np) || isdigit(*np)); ++np) {
|
|
|
|
*p++ = *np;
|
|
|
|
}
|
|
|
|
if (tinystrcmp(name, "ALU") == 0) {
|
2020-09-28 08:13:56 +00:00
|
|
|
p = stpcpy(p, kAluOp[(d->xedd->op.opcode & 070) >> 3]);
|
|
|
|
} else if (tinystrcmp(name, "ALU2") == 0) {
|
2020-09-07 04:39:00 +00:00
|
|
|
p = stpcpy(p, kAluOp[ModrmReg(rde)]);
|
2020-08-25 11:23:25 +00:00
|
|
|
} else if (tinystrcmp(np, "WLQ") == 0) {
|
|
|
|
notbyte = true;
|
|
|
|
wantsuffix = true;
|
2020-09-28 08:13:56 +00:00
|
|
|
} else if (tinystrcmp(np, "CC") == 0) {
|
|
|
|
p = stpcpy(p, kCc[d->xedd->op.opcode & 15]);
|
|
|
|
p = DisBranchTaken(d, p);
|
2020-08-25 11:23:25 +00:00
|
|
|
} else if (tinystrcmp(np, "WQ") == 0) {
|
|
|
|
notbyte = true;
|
2020-09-07 04:39:00 +00:00
|
|
|
notlong = Eamode(rde) != XED_MODE_REAL;
|
2020-08-25 11:23:25 +00:00
|
|
|
wantsuffix = true;
|
|
|
|
} else if (tinystrcmp(np, "LQ") == 0 || tinystrcmp(np, "WL") == 0) {
|
|
|
|
notbyte = true;
|
|
|
|
wantsuffix = true;
|
|
|
|
} else if (tinystrcmp(np, "SD") == 0) {
|
|
|
|
notbyte = true;
|
|
|
|
wantsuffixsd = true;
|
|
|
|
} else if (tinystrcmp(np, "ABS") == 0) {
|
2020-09-07 04:39:00 +00:00
|
|
|
if (Rexw(rde)) p = stpcpy(p, "abs");
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|
|
|
|
if (wantsuffixsd) {
|
2020-09-07 04:39:00 +00:00
|
|
|
if (Osz(rde)) {
|
2020-08-25 11:23:25 +00:00
|
|
|
*p++ = 'd';
|
|
|
|
} else {
|
|
|
|
*p++ = 's';
|
|
|
|
}
|
|
|
|
} else if (wantsuffix || (ambiguous && !startswith(name, "f") &&
|
|
|
|
!startswith(name, "set"))) {
|
2020-09-07 04:39:00 +00:00
|
|
|
if (Osz(rde)) {
|
2020-10-06 06:11:49 +00:00
|
|
|
if (ambiguous || Mode(rde) != XED_MODE_REAL) {
|
2020-09-07 04:39:00 +00:00
|
|
|
*p++ = 'w';
|
|
|
|
}
|
|
|
|
} else if (Rexw(rde)) {
|
2020-08-25 11:23:25 +00:00
|
|
|
*p++ = 'q';
|
2020-09-28 08:13:56 +00:00
|
|
|
} else if (ambiguous && !notbyte && IsProbablyByteOp(d->xedd)) {
|
2020-08-25 11:23:25 +00:00
|
|
|
*p++ = 'b';
|
|
|
|
} else if (!notlong) {
|
|
|
|
*p++ = 'l';
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
*p++ = ' ';
|
|
|
|
while (p - bp < 8) *p++ = ' ';
|
|
|
|
*p = '\0';
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Disassembles instruction based on string spec.
|
|
|
|
* @see DisSpec()
|
|
|
|
*/
|
2020-09-28 08:13:56 +00:00
|
|
|
char *DisInst(struct Dis *d, char *p, const char *spec) {
|
2020-08-25 11:23:25 +00:00
|
|
|
long i, n;
|
2020-10-06 06:11:49 +00:00
|
|
|
char sbuf[64];
|
|
|
|
char args[4][256];
|
2020-08-25 11:23:25 +00:00
|
|
|
char *s, *name, *state;
|
|
|
|
bool hasarg, hasmodrm, hasregister, hasmemory;
|
2020-09-28 08:13:56 +00:00
|
|
|
CHECK_EQ(0, (int)d->xedd->op.error);
|
2020-08-25 11:23:25 +00:00
|
|
|
DCHECK_LT(strlen(spec), 128);
|
|
|
|
hasarg = false;
|
2020-09-28 08:13:56 +00:00
|
|
|
hasmodrm = d->xedd->op.has_modrm;
|
|
|
|
hasmemory = hasmodrm && !IsModrmRegister(d->xedd->op.rde);
|
|
|
|
hasregister = hasmodrm && IsModrmRegister(d->xedd->op.rde);
|
2020-08-25 11:23:25 +00:00
|
|
|
name = strtok_r(strcpy(sbuf, spec), " ", &state);
|
|
|
|
for (n = 0; (s = strtok_r(NULL, " ", &state)); ++n) {
|
|
|
|
hasarg = true;
|
|
|
|
hasregister |= *s == '%';
|
|
|
|
hasmemory |= *s == 'O';
|
2020-09-28 08:13:56 +00:00
|
|
|
CHECK_LT(DisArg(d, args[n], s) - args[n], sizeof(args[n]));
|
2020-08-25 11:23:25 +00:00
|
|
|
}
|
2020-09-28 08:13:56 +00:00
|
|
|
p = HighStart(p, g_high.keyword);
|
|
|
|
p = DisName(d, p, name, hasarg && !hasregister && hasmemory);
|
|
|
|
p = HighEnd(p);
|
2020-08-25 11:23:25 +00:00
|
|
|
for (i = 0; i < n; ++i) {
|
|
|
|
if (i && args[n - i][0]) {
|
|
|
|
*p++ = ',';
|
|
|
|
}
|
|
|
|
p = stpcpy(p, args[n - i - 1]);
|
|
|
|
}
|
|
|
|
return p;
|
|
|
|
}
|