/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│ │vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│ ╞══════════════════════════════════════════════════════════════════════════════╡ │ Copyright 2020 Justine Alexandra Roberts Tunney │ │ │ │ This program is free software; you can redistribute it and/or modify │ │ it under the terms of the GNU General Public License as published by │ │ the Free Software Foundation; version 2 of the License. │ │ │ │ This program is distributed in the hope that it will be useful, but │ │ WITHOUT ANY WARRANTY; without even the implied warranty of │ │ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU │ │ General Public License for more details. │ │ │ │ You should have received a copy of the GNU General Public License │ │ along with this program; if not, write to the Free Software │ │ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA │ │ 02110-1301 USA │ ╚─────────────────────────────────────────────────────────────────────────────*/ #include "libc/assert.h" #include "libc/bits/popcnt.h" #include "libc/calls/calls.h" #include "libc/conv/conv.h" #include "libc/dce.h" #include "libc/intrin/pshufd.h" #include "libc/intrin/pshufhw.h" #include "libc/intrin/pshuflw.h" #include "libc/intrin/pshufw.h" #include "libc/intrin/shufpd.h" #include "libc/intrin/shufps.h" #include "libc/log/check.h" #include "libc/log/log.h" #include "libc/macros.h" #include "libc/math.h" #include "libc/nexgen32e/rdtsc.h" #include "libc/runtime/runtime.h" #include "libc/sysv/consts/clock.h" #include "libc/time/time.h" #include "tool/build/lib/abp.h" #include "tool/build/lib/alu.h" #include "tool/build/lib/bitscan.h" #include "tool/build/lib/case.h" #include "tool/build/lib/cond.h" #include "tool/build/lib/cpuid.h" #include "tool/build/lib/cvt.h" #include "tool/build/lib/divmul.h" #include "tool/build/lib/endian.h" #include "tool/build/lib/flags.h" #include "tool/build/lib/fpu.h" #include "tool/build/lib/ioports.h" #include "tool/build/lib/machine.h" #include "tool/build/lib/memory.h" #include "tool/build/lib/modrm.h" #include "tool/build/lib/sse.h" #include "tool/build/lib/stack.h" #include "tool/build/lib/stats.h" #include "tool/build/lib/string.h" #include "tool/build/lib/syscall.h" #include "tool/build/lib/throw.h" #define MUTATING true #define READONLY false #define UNCONDITIONAL true #define REG ModrmReg(m->xedd) #define UIMM0 m->xedd->op.uimm0 #define BITS (8 << RegLog2(m->xedd)) #define SIGN (1ull << (BITS - 1)) #define MASK (SIGN | (SIGN - 1)) #define SHIFTMASK (BITS - 1) typedef int int_v _Vector_size(16) aligned(16); typedef long long_v _Vector_size(16) aligned(16); typedef float float_v _Vector_size(16) aligned(16); typedef double double_v _Vector_size(16) aligned(16); typedef void (*machine_f)(struct Machine *); typedef void (*machine_u8p_u8p_f)(struct Machine *, uint8_t *, uint8_t *); typedef void (*alu_f)(struct Machine *, aluop2_f, bool); static uint64_t AluNot(struct Machine *m, uint64_t x) { return ~x & MASK; } static uint64_t AluNeg(struct Machine *m, uint64_t x) { m->flags = SetFlag(m->flags, FLAGS_CF, !!(x & MASK)); m->flags = SetFlag(m->flags, FLAGS_OF, (x & MASK) == SIGN); x = ~x + 1; m->flags = SetFlag(m->flags, FLAGS_ZF, !(x & MASK)); m->flags = SetFlag(m->flags, FLAGS_SF, !!(x & SIGN)); m->flags = SetLazyParityByte(m->flags, x); return x & MASK; } static uint64_t AluInc(struct Machine *m, uint64_t a) { uint64_t c; uint128_t x, z; a &= MASK; x = a; z = x + 1; c = z; m->flags = SetFlag(m->flags, FLAGS_ZF, !(c & MASK)); m->flags = SetFlag(m->flags, FLAGS_SF, !!(c & SIGN)); m->flags = SetFlag(m->flags, FLAGS_OF, !!((c ^ a) & (c ^ 1) & SIGN)); m->flags = SetLazyParityByte(m->flags, x); return c & MASK; } static uint64_t AluDec(struct Machine *m, uint64_t a) { uint64_t c; uint128_t x, z; a &= MASK; x = a; z = x - 1; c = z; m->flags = SetFlag(m->flags, FLAGS_ZF, !(c & MASK)); m->flags = SetFlag(m->flags, FLAGS_SF, !!(c & SIGN)); m->flags = SetFlag(m->flags, FLAGS_OF, !!((c ^ a) & (a ^ 1) & SIGN)); m->flags = SetLazyParityByte(m->flags, x); return c & MASK; } static void ImportFlags(struct Machine *m, uint64_t flags) { uint64_t old, mask = 0; mask |= 1u << FLAGS_CF; mask |= 1u << FLAGS_PF; mask |= 1u << FLAGS_AF; mask |= 1u << FLAGS_ZF; mask |= 1u << FLAGS_SF; mask |= 1u << FLAGS_TF; mask |= 1u << FLAGS_IF; mask |= 1u << FLAGS_DF; mask |= 1u << FLAGS_OF; mask |= 1u << FLAGS_NT; mask |= 1u << FLAGS_AC; mask |= 1u << FLAGS_ID; m->flags = (flags & mask) | (m->flags & ~mask); m->flags = SetFlag(m->flags, FLAGS_RF, false); m->flags = SetLazyParityByte(m->flags, !((m->flags >> FLAGS_PF) & 1)); } static uint64_t ReadMemory(struct Machine *m, uint8_t p[8]) { if (Rexw(m->xedd)) { return Read64(p); } else if (!Osz(m->xedd)) { return Read32(p); } else { return Read16(p); } } static int64_t ReadMemorySigned(struct Machine *m, uint8_t p[8]) { if (Rexw(m->xedd)) { return (int64_t)Read64(p); } else if (!Osz(m->xedd)) { return (int32_t)Read32(p); } else { return (int16_t)Read16(p); } } static void WriteRegister(struct Machine *m, uint8_t p[8], uint64_t x) { if (Rexw(m->xedd)) { Write64(p, x); } else if (!Osz(m->xedd)) { Write64(p, x & 0xffffffff); } else { Write16(p, x); } } static void WriteMemory(struct Machine *m, uint8_t p[8], uint64_t x) { if (Rexw(m->xedd)) { Write64(p, x); } else if (!Osz(m->xedd)) { Write32(p, x); } else { Write16(p, x); } } static void WriteRegisterOrMemory(struct Machine *m, uint8_t p[8], uint64_t x) { if (IsModrmRegister(m->xedd)) { WriteRegister(m, p, x); } else { WriteMemory(m, p, x); } } static void OpLfence(struct Machine *m) { } static void OpMfence(struct Machine *m) { } static void OpSfence(struct Machine *m) { } static void OpClflush(struct Machine *m) { } static void OpWutNopEv(struct Machine *m) { } static void OpCmc(struct Machine *m) { m->flags = SetFlag(m->flags, FLAGS_CF, !GetFlag(m->flags, FLAGS_CF)); } static void OpClc(struct Machine *m) { m->flags = SetFlag(m->flags, FLAGS_CF, false); } static void OpStc(struct Machine *m) { m->flags = SetFlag(m->flags, FLAGS_CF, true); } static void OpCli(struct Machine *m) { m->flags = SetFlag(m->flags, FLAGS_IF, false); } static void OpSti(struct Machine *m) { m->flags = SetFlag(m->flags, FLAGS_IF, true); } static void OpCld(struct Machine *m) { m->flags = SetFlag(m->flags, FLAGS_DF, false); } static void OpStd(struct Machine *m) { m->flags = SetFlag(m->flags, FLAGS_DF, true); } static void OpPushf(struct Machine *m) { PushOsz(m, ExportFlags(m->flags) & 0xFCFFFF); } static void OpPopf(struct Machine *m) { if (!Osz(m->xedd)) { ImportFlags(m, Pop64(m, 0)); } else { ImportFlags(m, (m->flags & ~0xFFFFull) | Pop16(m, 0)); } } static void OpLahf(struct Machine *m) { Write8(m->ax + 1, ExportFlags(m->flags)); } static void OpPushFs(struct Machine *m) { ThrowSegmentationFault(m, m->ip); } static void OpPopFs(struct Machine *m) { ThrowSegmentationFault(m, m->ip); } static void OpPushGs(struct Machine *m) { ThrowSegmentationFault(m, m->ip); } static void OpPopGs(struct Machine *m) { ThrowSegmentationFault(m, m->ip); } static void OpSahf(struct Machine *m) { ImportFlags(m, (m->flags & ~0xFFull) | m->ax[1]); } static void OpEbSetCc(struct Machine *m, bool x) { Write8(GetModrmRegisterBytePointerWrite(m), x); } static void OpLeaGvqpM(struct Machine *m) { Write64(RegRexrReg(m), ComputeAddress(m)); } static void PushVq(struct Machine *m, uint8_t *p) { if (!Osz(m->xedd)) { Push64(m, Read64(p)); } else { Push16(m, Read16(p)); } } static void PopVq(struct Machine *m, uint8_t *p) { if (!Osz(m->xedd)) { Write64(p, Pop64(m, 0)); } else { Write16(p, Pop16(m, 0)); } } static void OpPushEvq(struct Machine *m) { PushVq(m, GetModrmRegisterWordPointerReadOsz(m)); } static void OpPushZvq(struct Machine *m) { PushVq(m, RegRexbSrm(m)); } static void OpPopZvq(struct Machine *m) { PopVq(m, RegRexbSrm(m)); } static void OpPopEvq(struct Machine *m) { PopVq(m, GetModrmRegisterWordPointerWriteOsz(m)); } static void OpJmp(struct Machine *m) { m->ip += m->xedd->op.disp; } static void OpJmpEq(struct Machine *m) { m->ip = Read64(GetModrmRegisterWordPointerRead8(m)); } static void OpJcxz(struct Machine *m) { uint64_t count; count = Read64(m->cx); if (Asz(m->xedd)) count &= 0xffffffff; if (!count) OpJmp(m); } static void OpLoop(struct Machine *m, bool cond) { uint64_t count; count = Read64(m->cx) - 1; if (Asz(m->xedd)) count &= 0xffffffff; Write64(m->cx, count); if (count && cond) m->ip += m->xedd->op.disp; } static void OpXlat(struct Machine *m) { int64_t v; uint8_t al, *p; v = Read64(m->bx) + Read8(m->ax); if (Asz(m->xedd)) v &= 0xffffffff; SetReadAddr(m, v, 1); Write8(m->ax, Read8(ResolveAddress(m, v))); } static void OpEb(struct Machine *m, aluop1_f op) { uint8_t *p; p = GetModrmRegisterBytePointerWrite(m); Write8(p, op(m, Read8(p))); } static void OpEvqp(struct Machine *m, aluop1_f op) { uint8_t *p; p = GetModrmRegisterWordPointerWriteOszRexw(m); WriteRegisterOrMemory(m, p, op(m, ReadMemory(m, p))); } static void OpGvqpEvqp(struct Machine *m, aluop2_f op, bool write) { uint64_t x; x = op(m, ReadMemory(m, RegRexrReg(m)), ReadMemory(m, GetModrmRegisterWordPointerReadOszRexw(m))); if (write) WriteRegister(m, RegRexrReg(m), x); } static void OpEvqpGvqp(struct Machine *m, aluop2_f op, bool write) { uint8_t *p; uint64_t x, y; p = GetModrmRegisterWordPointerWriteOszRexw(m); x = ReadMemory(m, p); y = ReadMemory(m, RegRexrReg(m)); x = op(m, x, y); if (write) WriteRegisterOrMemory(m, p, x); } static void OpXchgZvqp(struct Machine *m) { uint64_t x, y; x = Read64(m->ax); y = Read64(RegRexbSrm(m)); WriteRegister(m, m->ax, y); WriteRegister(m, RegRexbSrm(m), x); } static void OpBofram(struct Machine *m) { if (m->xedd->op.disp) { m->bofram[0] = m->ip; m->bofram[1] = m->ip + (m->xedd->op.disp & 0xff); } else { m->bofram[0] = 0; m->bofram[1] = 0; } } static void OpNopEv(struct Machine *m) { if (m->xedd->op.modrm == 0x45) { OpBofram(m); } } static void OpPause(struct Machine *m) { sched_yield(); } static void OpNop(struct Machine *m) { if (m->xedd->op.rexb) { OpXchgZvqp(m); } else if (m->xedd->op.ild_f3) { OpPause(m); } } static void OpXchgGbEb(struct Machine *m) { uint8_t *b; uint8_t x, y; b = GetModrmRegisterBytePointerWrite(m); x = Read8(ByteRexrReg(m)); y = Read8(b); Write8(ByteRexrReg(m), y); Write8(b, x); } static void OpXchgGvqpEvqp(struct Machine *m) { uint8_t *p; uint64_t x, y; p = GetModrmRegisterWordPointerWriteOszRexw(m); x = ReadMemory(m, RegRexrReg(m)); y = ReadMemory(m, p); WriteRegister(m, RegRexrReg(m), y); WriteRegisterOrMemory(m, p, x); } static void OpCmpxchgEbAlGb(struct Machine *m) { uint8_t *p; uint8_t x, y, z; p = GetModrmRegisterBytePointerWrite(m); x = Read8(m->ax); y = Read8(p); z = Read8(ByteRexrReg(m)); Alu(0, ALU_SUB, x, y, &m->flags); if (GetFlag(m->flags, FLAGS_ZF)) { Write8(p, z); } else { Write8(m->ax, y); } } static void OpCmpxchgEvqpRaxGvqp(struct Machine *m) { uint8_t *p; uint64_t x, y, z; p = GetModrmRegisterWordPointerWriteOszRexw(m); x = ReadMemory(m, m->ax); y = ReadMemory(m, p); z = ReadMemory(m, RegRexrReg(m)); Alu(RegLog2(m->xedd), ALU_SUB, x, y, &m->flags); if (GetFlag(m->flags, FLAGS_ZF)) { WriteRegisterOrMemory(m, p, z); } else { WriteRegister(m, m->ax, y); } } static void OpCmpxchg8b(struct Machine *m) { uint8_t *p; uint32_t d, a; p = GetModrmRegisterXmmPointerRead8(m); a = Read32(p + 0); d = Read32(p + 4); if (a == Read32(m->ax) && d == Read32(m->dx)) { SetFlag(m->flags, FLAGS_ZF, true); memcpy(p + 0, m->bx, 4); memcpy(p + 4, m->cx, 4); } else { SetFlag(m->flags, FLAGS_ZF, false); Write32(m->ax, a); Write32(m->dx, d); } } static void OpCmpxchg16b(struct Machine *m) { uint8_t *p; uint64_t d, a; p = GetModrmRegisterXmmPointerRead16(m); a = Read64(p + 0); d = Read64(p + 8); if (a == Read64(m->ax) && d == Read64(m->dx)) { SetFlag(m->flags, FLAGS_ZF, true); memcpy(p + 0, m->bx, 8); memcpy(p + 8, m->cx, 8); } else { SetFlag(m->flags, FLAGS_ZF, false); Write64(m->ax, a); Write64(m->dx, d); } } static void OpCmpxchgDxAx(struct Machine *m) { if (Rexw(m->xedd)) { OpCmpxchg16b(m); } else { OpCmpxchg8b(m); } } static uint64_t OpDoubleShift(struct Machine *m, uint64_t x, uint64_t y) { uint8_t b, w, W[2][2] = {{2, 3}, {1, 3}}; return BsuDoubleShift( W[Osz(m->xedd)][Rexw(m->xedd)], x, y, m->xedd->op.opcode & 1 ? Read8(m->cx) : m->xedd->op.uimm0, m->xedd->op.opcode & 8, &m->flags); } static uint64_t OpBts(uint64_t x, uint64_t y) { return x | y; } static uint64_t OpBtr(uint64_t x, uint64_t y) { return x & ~y; } static uint64_t OpBtc(uint64_t x, uint64_t y) { return (x & ~y) | (~x & y); } static void OpBit(struct Machine *m) { int op; uint8_t *p; unsigned bit; int64_t disp; uint64_t v, x, y, z; uint8_t w, W[2][2] = {{2, 3}, {1, 3}}; w = W[Osz(m->xedd)][Rexw(m->xedd)]; if (m->xedd->op.opcode == 0xBA) { op = ModrmReg(m->xedd); bit = m->xedd->op.uimm0 & ((8 << w) - 1); disp = 0; } else { op = (m->xedd->op.opcode & 070) >> 3; disp = ReadMemorySigned(m, RegRexrReg(m)); bit = disp & ((8 << w) - 1); disp &= -(8 << w); disp >>= 3; } if (IsModrmRegister(m->xedd)) { p = RegRexbRm(m); } else { v = ComputeAddress(m) + disp; if (Asz(m->xedd)) v &= 0xffffffff; p = ReserveAddress(m, v, 1 << w); if (op == 4) { SetReadAddr(m, v, 1 << w); } else { SetWriteAddr(m, v, 1 << w); } } y = 1ull << bit; x = ReadMemory(m, p); m->flags = SetFlag(m->flags, FLAGS_CF, !!(y & x)); switch (op) { case 4: return; case 5: z = OpBts(x, y); break; case 6: z = OpBtr(x, y); break; case 7: z = OpBtc(x, y); break; default: OpUd(m); } WriteRegisterOrMemory(m, p, z); } static void OpConvert1(struct Machine *m) { if (Rexw(m->xedd)) { Write64(m->ax, Read32(m->ax) | (Read32(m->ax) & 0x80000000 ? 0xffffffff00000000 : 0)); } else if (!Osz(m->xedd)) { Write64(m->ax, Read16(m->ax) | (Read16(m->ax) & 0x8000 ? 0xffff0000 : 0)); } else { Write16(m->ax, Read8(m->ax) | (Read8(m->ax) & 0x0080 ? 0xff00 : 0)); } } static void OpConvert2(struct Machine *m) { if (Rexw(m->xedd)) { Write64(m->dx, Read64(m->ax) & 0x8000000000000000 ? 0xffffffffffffffff : 0); } else if (!Osz(m->xedd)) { Write64(m->dx, Read32(m->ax) & 0x80000000 ? 0xffffffff : 0); } else { Write16(m->dx, Read16(m->ax) & 0x8000 ? 0xffff : 0); } } static void OpBswapZvqp(struct Machine *m) { uint64_t x; x = Read64(RegRexbSrm(m)); if (Rexw(m->xedd)) { Write64( RegRexbSrm(m), ((x & 0xff00000000000000) >> 070 | (x & 0x00000000000000ff) << 070 | (x & 0x00ff000000000000) >> 050 | (x & 0x000000000000ff00) << 050 | (x & 0x0000ff0000000000) >> 030 | (x & 0x0000000000ff0000) << 030 | (x & 0x000000ff00000000) >> 010 | (x & 0x00000000ff000000) << 010)); } else if (!Osz(m->xedd)) { Write64(RegRexbSrm(m), ((x & 0xff000000) >> 030 | (x & 0x000000ff) << 030 | (x & 0x00ff0000) >> 010 | (x & 0x0000ff00) << 010)); } else { Write16(RegRexbSrm(m), (x & 0x00ff) << 010 | (x & 0xff00) << 010); } } static uint8_t pmovmskb(uint64_t x) { return (x & 0x0000000000000080) >> 007 | (x & 0x0000000000008000) >> 016 | (x & 0x0000000000800000) >> 025 | (x & 0x0000000080000000) >> 034 | (x & 0x0000008000000000) >> 043 | (x & 0x0000800000000000) >> 052 | (x & 0x0080000000000000) >> 061 | (x & 0x8000000000000000) >> 070; } static void OpPmovmskbGdqpNqUdq(struct Machine *m) { uint64_t bitmask; if (Prefix66(m->xedd)) { bitmask = pmovmskb(Read64(XmmRexbRm(m) + 8)) << 8 | pmovmskb(Read64(XmmRexbRm(m))); } else { bitmask = pmovmskb(Read64(MmRm(m) + 8)) << 8 | pmovmskb(Read64(MmRm(m))); } Write64(RegRexrReg(m), bitmask); } static void OpRdtsc(struct Machine *m) { uint64_t c; #ifdef __x86_64__ c = rdtsc(); #else struct timespec ts; clock_gettime(CLOCK_MONOTONIC, &ts); c = ts.tv_sec * 1000000000 + ts.tv_nsec; #endif Write64(m->ax, c & 0xffffffff); c >>= 32; Write64(m->dx, c & 0xffffffff); } static void OpMovEvqpSw(struct Machine *m) { ThrowSegmentationFault(m, m->ip); } static void OpMovSwEvqp(struct Machine *m) { ThrowSegmentationFault(m, m->ip); } static void OpMovEbIb(struct Machine *m) { Write8(GetModrmRegisterBytePointerWrite(m), m->xedd->op.uimm0); } static void OpMovAlOb(struct Machine *m) { memcpy(ResolveAddress(m, m->xedd->op.uimm0), m->ax, 1); } static void OpMovObAl(struct Machine *m) { memcpy(m->ax, ResolveAddress(m, m->xedd->op.uimm0), 1); } static void OpMovRaxOvqp(struct Machine *m) { WriteRegister(m, m->ax, ReadMemory(m, ResolveAddress(m, m->xedd->op.uimm0))); } static void OpMovOvqpRax(struct Machine *m) { WriteMemory(m, ResolveAddress(m, m->xedd->op.uimm0), Read64(m->ax)); } static void OpMovEbGb(struct Machine *m) { memcpy(GetModrmRegisterBytePointerWrite(m), ByteRexrReg(m), 1); } static void OpMovGbEb(struct Machine *m) { memcpy(ByteRexrReg(m), GetModrmRegisterBytePointerRead(m), 1); } static void OpMovZbIb(struct Machine *m) { Write8(ByteRexbSrm(m), m->xedd->op.uimm0); } static void OpMovZvqpIvqp(struct Machine *m) { WriteRegister(m, RegRexbSrm(m), m->xedd->op.uimm0); } static void OpMovEvqpIvds(struct Machine *m) { WriteRegisterOrMemory(m, GetModrmRegisterWordPointerWriteOszRexw(m), m->xedd->op.uimm0); } static void OpMovEvqpGvqp(struct Machine *m) { WriteRegisterOrMemory(m, GetModrmRegisterWordPointerWriteOszRexw(m), ReadMemory(m, RegRexrReg(m))); } static void OpMovGvqpEvqp(struct Machine *m) { WriteRegister(m, RegRexrReg(m), ReadMemory(m, GetModrmRegisterWordPointerReadOszRexw(m))); } static void OpMovzbGvqpEb(struct Machine *m) { WriteRegister(m, RegRexrReg(m), Read8(GetModrmRegisterBytePointerRead(m))); } static void OpMovzwGvqpEw(struct Machine *m) { WriteRegister(m, RegRexrReg(m), Read16(GetModrmRegisterWordPointerRead2(m))); } static void OpMovsbGvqpEb(struct Machine *m) { WriteRegister(m, RegRexrReg(m), (int8_t)Read8(GetModrmRegisterBytePointerRead(m))); } static void OpMovswGvqpEw(struct Machine *m) { WriteRegister(m, RegRexrReg(m), (int16_t)Read16(GetModrmRegisterWordPointerRead2(m))); } static void OpMovsxdGdqpEd(struct Machine *m) { uint64_t x; uint8_t *p; x = (int32_t)Read32(GetModrmRegisterWordPointerRead4(m)); if (!Rexw(m->xedd)) x &= 0xffffffff; /* wut */ Write64(RegRexrReg(m), x); } static void OpMovdquVdqWdq(struct Machine *m) { memcpy(XmmRexrReg(m), GetModrmRegisterXmmPointerRead16(m), 16); } static void OpMovdquWdqVdq(struct Machine *m) { memcpy(GetModrmRegisterXmmPointerWrite16(m), XmmRexrReg(m), 16); } static void OpMovupsVpsWps(struct Machine *m) { OpMovdquVdqWdq(m); } static void OpMovupsWpsVps(struct Machine *m) { OpMovdquWdqVdq(m); } static void OpMovupdVpsWps(struct Machine *m) { OpMovdquVdqWdq(m); } static void OpMovupdWpsVps(struct Machine *m) { OpMovdquWdqVdq(m); } static void OpLddquVdqMdq(struct Machine *m) { OpMovdquVdqWdq(m); } static void OpMovdqaVdqMdq(struct Machine *m) { int64_t v; uint8_t *p; v = ComputeAddress(m); SetReadAddr(m, v, 16); if ((v & 15) || !(p = FindReal(m, v))) ThrowSegmentationFault(m, v); memcpy(XmmRexrReg(m), Abp16(p), 16); } static void OpMovdqaMdqVdq(struct Machine *m) { int64_t v; uint8_t *p; v = ComputeAddress(m); SetWriteAddr(m, v, 16); if ((v & 15) || !(p = FindReal(m, v))) ThrowSegmentationFault(m, v); memcpy(Abp16(p), XmmRexrReg(m), 16); } static void OpMovdqaVdqWdq(struct Machine *m) { if (IsModrmRegister(m->xedd)) { memcpy(XmmRexrReg(m), XmmRexbRm(m), 16); } else { OpMovdqaVdqMdq(m); } } static void OpMovdqaWdqVdq(struct Machine *m) { if (IsModrmRegister(m->xedd)) { memcpy(XmmRexbRm(m), XmmRexrReg(m), 16); } else { OpMovdqaMdqVdq(m); } } static void OpMovntiMdqpGdqp(struct Machine *m) { int64_t v; uint8_t *a; void *p[2]; uint8_t n, b[8]; v = ComputeAddress(m); n = Rexw(m->xedd) ? 8 : 4; a = BeginStore(m, v, n, p, b); SetWriteAddr(m, v, n); memcpy(p, XmmRexrReg(m), n); EndStore(m, v, n, p, b); } static void OpMovntdqMdqVdq(struct Machine *m) { OpMovdqaMdqVdq(m); } static void OpMovntpsMpsVps(struct Machine *m) { OpMovdqaMdqVdq(m); } static void OpMovntpdMpdVpd(struct Machine *m) { OpMovdqaMdqVdq(m); } static void OpMovntdqaVdqMdq(struct Machine *m) { OpMovdqaVdqMdq(m); } static void OpMovqPqQq(struct Machine *m) { memcpy(MmReg(m), GetModrmRegisterMmPointerRead8(m), 8); } static void OpMovqQqPq(struct Machine *m) { memcpy(GetModrmRegisterMmPointerWrite8(m), MmReg(m), 8); } static void OpMovqVdqEqp(struct Machine *m) { memcpy(XmmRexrReg(m), GetModrmRegisterWordPointerRead8(m), 8); memset(XmmRexrReg(m) + 8, 0, 8); } static void OpMovdVdqEd(struct Machine *m) { memset(XmmRexrReg(m), 0, 16); memcpy(XmmRexrReg(m), GetModrmRegisterWordPointerRead4(m), 4); } static void OpMovqPqEqp(struct Machine *m) { memcpy(MmReg(m), GetModrmRegisterWordPointerRead8(m), 8); } static void OpMovdPqEd(struct Machine *m) { memcpy(MmReg(m), GetModrmRegisterWordPointerRead4(m), 4); memset(MmReg(m) + 4, 0, 4); } static void OpMovdEdVdq(struct Machine *m) { if (IsModrmRegister(m->xedd)) { memset(RegRexbRm(m), 0, 16); memcpy(RegRexbRm(m), XmmRexrReg(m), 4); } else { memcpy(ComputeReserveAddressWrite4(m), XmmRexrReg(m), 4); } } static void OpMovqEqpVdq(struct Machine *m) { memcpy(GetModrmRegisterWordPointerWrite8(m), XmmRexrReg(m), 8); } static void OpMovdEdPq(struct Machine *m) { if (IsModrmRegister(m->xedd)) { memcpy(RegRexbRm(m), MmReg(m), 4); memset(RegRexbRm(m) + 4, 0, 4); } else { memcpy(ComputeReserveAddressWrite4(m), MmReg(m), 4); } } static void OpMovqEqpPq(struct Machine *m) { memcpy(GetModrmRegisterWordPointerWrite(m, 8), MmReg(m), 8); } static void OpMovntqMqPq(struct Machine *m) { memcpy(ComputeReserveAddressWrite8(m), MmReg(m), 8); } static void OpMovqVqWq(struct Machine *m) { memcpy(XmmRexrReg(m), GetModrmRegisterXmmPointerRead8(m), 8); memset(XmmRexrReg(m) + 8, 0, 8); } static void OpMovssVpsWps(struct Machine *m) { memcpy(XmmRexrReg(m), GetModrmRegisterXmmPointerRead4(m), 4); } static void OpMovssWpsVps(struct Machine *m) { memcpy(GetModrmRegisterXmmPointerWrite4(m), XmmRexrReg(m), 4); } static void OpMovsdVpsWps(struct Machine *m) { memcpy(XmmRexrReg(m), GetModrmRegisterXmmPointerRead16(m), 8); } static void OpMovsdWpsVps(struct Machine *m) { memcpy(GetModrmRegisterXmmPointerWrite16(m), XmmRexrReg(m), 8); } static void OpMaskMovDiXmmRegXmmRm(struct Machine *m) { void *p[2]; uint64_t v; unsigned i, n; uint8_t *mem, b[16]; n = Prefix66(m->xedd) ? 16 : 8; v = GetSegment() + Read64(m->di); if (Asz(m->xedd)) v &= 0xffffffff; mem = BeginStore(m, v, n, p, b); for (i = 0; i < n; ++i) { if (XmmRexbRm(m)[i] & 0x80) { mem[i] = XmmRexrReg(m)[i]; } } EndStore(m, v, n, p, b); } static void OpMovhlpsVqUq(struct Machine *m) { memcpy(XmmRexrReg(m), XmmRexbRm(m) + 8, 8); } static void OpMovlpsVqMq(struct Machine *m) { memcpy(XmmRexrReg(m), ComputeReserveAddressRead8(m), 8); } static void OpMovlpdVqMq(struct Machine *m) { memcpy(XmmRexrReg(m), ComputeReserveAddressRead8(m), 8); } static void OpMovddupVqWq(struct Machine *m) { uint8_t *dst, *src; dst = XmmRexrReg(m); src = GetModrmRegisterXmmPointerRead8(m); memcpy(dst + 0, src, 8); memcpy(dst + 8, src, 8); } static void OpMovsldupVqWq(struct Machine *m) { uint8_t *dst, *src; dst = XmmRexrReg(m); src = GetModrmRegisterXmmPointerRead16(m); memcpy(dst + 0 + 0, src + 0, 4); memcpy(dst + 0 + 4, src + 0, 4); memcpy(dst + 8 + 0, src + 8, 4); memcpy(dst + 8 + 4, src + 8, 4); } static void OpMovlpsMqVq(struct Machine *m) { memcpy(ComputeReserveAddressWrite8(m), XmmRexrReg(m), 8); } static void OpMovlpdMqVq(struct Machine *m) { memcpy(ComputeReserveAddressWrite8(m), XmmRexrReg(m), 8); } static void OpMovlhpsVqUq(struct Machine *m) { memcpy(XmmRexrReg(m) + 8, XmmRexbRm(m), 8); } static void OpMovhpsVqMq(struct Machine *m) { memcpy(XmmRexrReg(m) + 8, ComputeReserveAddressRead8(m), 8); } static void OpMovhpdVqMq(struct Machine *m) { memcpy(XmmRexrReg(m) + 8, ComputeReserveAddressRead8(m), 8); } static void OpMovshdupVqWq(struct Machine *m) { uint8_t *dst, *src; dst = XmmRexrReg(m); src = GetModrmRegisterXmmPointerRead16(m); memcpy(dst + 0 + 0, src + 04, 4); memcpy(dst + 0 + 4, src + 04, 4); memcpy(dst + 8 + 0, src + 12, 4); memcpy(dst + 8 + 4, src + 12, 4); } static void OpMovhpsMqVq(struct Machine *m) { memcpy(ComputeReserveAddressRead8(m), XmmRexrReg(m) + 8, 8); } static void OpMovhpdMqVq(struct Machine *m) { memcpy(ComputeReserveAddressRead8(m), XmmRexrReg(m) + 8, 8); } static void OpMovqWqVq(struct Machine *m) { if (IsModrmRegister(m->xedd)) { memcpy(XmmRexbRm(m), XmmRexrReg(m), 8); memset(XmmRexbRm(m) + 8, 0, 8); } else { memcpy(ComputeReserveAddressWrite8(m), XmmRexrReg(m), 8); } } static void OpMovq2dqVdqNq(struct Machine *m) { memcpy(XmmRexrReg(m), MmRm(m), 8); memset(XmmRexrReg(m) + 8, 0, 8); } static void OpMovdq2qPqUq(struct Machine *m) { memcpy(MmReg(m), XmmRexbRm(m), 8); } static void OpMovapsVpsWps(struct Machine *m) { OpMovdqaVdqWdq(m); } static void OpMovapdVpdWpd(struct Machine *m) { OpMovdqaVdqWdq(m); } static void OpMovapsWpsVps(struct Machine *m) { OpMovdqaWdqVdq(m); } static void OpMovapdWpdVpd(struct Machine *m) { OpMovdqaWdqVdq(m); } static void OpMovWpsVps(struct Machine *m) { uint8_t *p, *r; switch (m->xedd->op.rep | Prefix66(m->xedd)) { case 0: OpMovupsWpsVps(m); break; case 1: OpMovupdWpsVps(m); break; case 2: OpMovsdWpsVps(m); break; case 3: OpMovssWpsVps(m); break; default: unreachable; } } static void OpMov0f28(struct Machine *m) { if (!Prefix66(m->xedd)) { OpMovapsVpsWps(m); } else { OpMovapdVpdWpd(m); } } static void OpMov0f6e(struct Machine *m) { if (Prefix66(m->xedd)) { if (Rexw(m->xedd)) { OpMovqVdqEqp(m); } else { OpMovdVdqEd(m); } } else { if (Rexw(m->xedd)) { OpMovqPqEqp(m); } else { OpMovdPqEd(m); } } } static void OpMov0f6f(struct Machine *m) { if (Prefix66(m->xedd)) { OpMovdqaVdqWdq(m); } else if (m->xedd->op.ild_f3) { OpMovdquVdqWdq(m); } else { OpMovqPqQq(m); } } static void OpMov0fE7(struct Machine *m) { if (!Prefix66(m->xedd)) { OpMovntqMqPq(m); } else { OpMovntdqMdqVdq(m); } } static void OpMov0f7e(struct Machine *m) { if (m->xedd->op.ild_f3) { OpMovqVqWq(m); } else if (Prefix66(m->xedd)) { if (Rexw(m->xedd)) { OpMovqEqpVdq(m); } else { OpMovdEdVdq(m); } } else { if (Rexw(m->xedd)) { OpMovqEqpPq(m); } else { OpMovdEdPq(m); } } } static void OpMov0f7f(struct Machine *m) { if (m->xedd->op.ild_f3) { OpMovdquWdqVdq(m); } else if (Prefix66(m->xedd)) { OpMovdqaWdqVdq(m); } else { OpMovqQqPq(m); } } static void OpMov0f10(struct Machine *m) { uint8_t *p, *r; switch (m->xedd->op.rep | Prefix66(m->xedd)) { case 0: OpMovupsVpsWps(m); break; case 1: OpMovupdVpsWps(m); break; case 2: OpMovsdVpsWps(m); break; case 3: OpMovssVpsWps(m); break; default: unreachable; } } static void OpMov0f29(struct Machine *m) { if (!Prefix66(m->xedd)) { OpMovapsWpsVps(m); } else { OpMovapdWpdVpd(m); } } static void OpMov0f2b(struct Machine *m) { if (!Prefix66(m->xedd)) { OpMovntpsMpsVps(m); } else { OpMovntpdMpdVpd(m); } } static void OpMov0f12(struct Machine *m) { switch (m->xedd->op.rep | Prefix66(m->xedd)) { case 0: if (IsModrmRegister(m->xedd)) { OpMovhlpsVqUq(m); } else { OpMovlpsVqMq(m); } break; case 1: OpMovlpdVqMq(m); break; case 2: OpMovddupVqWq(m); break; case 3: OpMovsldupVqWq(m); break; default: unreachable; } } static void OpMov0f13(struct Machine *m) { if (Prefix66(m->xedd)) { OpMovlpdMqVq(m); } else { OpMovlpsMqVq(m); } } static void OpMov0f16(struct Machine *m) { switch (m->xedd->op.rep | Prefix66(m->xedd)) { case 0: if (IsModrmRegister(m->xedd)) { OpMovlhpsVqUq(m); } else { OpMovhpsVqMq(m); } break; case 1: OpMovhpdVqMq(m); break; case 3: OpMovshdupVqWq(m); break; default: OpUd(m); break; } } static void OpMov0f17(struct Machine *m) { if (Prefix66(m->xedd)) { OpMovhpdMqVq(m); } else { OpMovhpsMqVq(m); } } static void OpMov0fD6(struct Machine *m) { if (m->xedd->op.ild_f3) { OpMovq2dqVdqNq(m); } else if (m->xedd->op.ild_f2) { OpMovdq2qPqUq(m); } else if (Prefix66(m->xedd)) { OpMovqWqVq(m); } else { OpUd(m); } } static void OpUnpcklpsd(struct Machine *m) { uint8_t *a, *b; a = XmmRexrReg(m); b = GetModrmRegisterXmmPointerRead8(m); if (Prefix66(m->xedd)) { memcpy(a + 8, b, 8); } else { memcpy(a + 4 * 3, b + 4, 4); memcpy(a + 4 * 2, a + 4, 4); memcpy(a + 4 * 1, b + 0, 4); } } static void OpUnpckhpsd(struct Machine *m) { uint8_t *a, *b; a = XmmRexrReg(m); b = GetModrmRegisterXmmPointerRead16(m); if (Prefix66(m->xedd)) { memcpy(a + 0, b + 8, 8); memcpy(a + 8, b + 8, 8); } else { memcpy(a + 4 * 0, a + 4 * 2, 4); memcpy(a + 4 * 1, b + 4 * 2, 4); memcpy(a + 4 * 2, a + 4 * 3, 4); memcpy(a + 4 * 3, b + 4 * 3, 4); } } static void OpPextrwGdqpUdqIb(struct Machine *m) { uint8_t i; i = m->xedd->op.uimm0; i &= Prefix66(m->xedd) ? 7 : 3; Write16(RegRexrReg(m), Read16(XmmRexbRm(m) + i * 2)); } static void OpPinsrwVdqEwIb(struct Machine *m) { uint8_t i; i = m->xedd->op.uimm0; i &= Prefix66(m->xedd) ? 7 : 3; Write16(XmmRexrReg(m) + i * 2, Read16(GetModrmRegisterWordPointerRead2(m))); } static void OpShuffle(struct Machine *m) { int16_t q16[4]; int16_t x16[8]; int32_t x32[4]; switch (m->xedd->op.rep | Prefix66(m->xedd)) { case 0: memcpy(q16, GetModrmRegisterXmmPointerRead8(m), 8); (pshufw)(q16, q16, m->xedd->op.uimm0); memcpy(XmmRexrReg(m), q16, 8); break; case 1: memcpy(x32, GetModrmRegisterXmmPointerRead16(m), 16); (pshufd)(x32, x32, m->xedd->op.uimm0); memcpy(XmmRexrReg(m), x32, 16); break; case 2: memcpy(x16, GetModrmRegisterXmmPointerRead16(m), 16); (pshuflw)(x16, x16, m->xedd->op.uimm0); memcpy(XmmRexrReg(m), x16, 16); break; case 3: memcpy(x16, GetModrmRegisterXmmPointerRead16(m), 16); (pshufhw)(x16, x16, m->xedd->op.uimm0); memcpy(XmmRexrReg(m), x16, 16); break; default: unreachable; } } static void OpShufpsd(struct Machine *m) { float s[4]; double d[2]; if (Prefix66(m->xedd)) { memcpy(d, GetModrmRegisterXmmPointerRead16(m), 16); (shufpd)(d, d, m->xedd->op.uimm0); memcpy(XmmRexrReg(m), d, 16); } else { memcpy(s, GetModrmRegisterXmmPointerRead16(m), 16); (shufps)(s, s, m->xedd->op.uimm0); memcpy(XmmRexrReg(m), s, 16); } } static void OpSqrtpsd(struct Machine *m) { long i; float_v xf; double_v xd; switch (m->xedd->op.rep | Prefix66(m->xedd)) { case 0: memcpy(&xf, GetModrmRegisterXmmPointerRead16(m), 16); for (i = 0; i < 4; ++i) xf[i] = sqrtf(xf[i]); memcpy(XmmRexrReg(m), &xf, 16); break; case 1: memcpy(&xd, GetModrmRegisterXmmPointerRead16(m), 16); for (i = 0; i < 2; ++i) xd[i] = sqrt(xd[i]); memcpy(XmmRexrReg(m), &xd, 16); break; case 2: memcpy(&xd, GetModrmRegisterXmmPointerRead8(m), 8); xd[0] = sqrt(xd[0]); memcpy(XmmRexrReg(m), &xd, 8); break; case 3: memcpy(&xf, GetModrmRegisterXmmPointerRead4(m), 4); xf[0] = sqrtf(xf[0]); memcpy(XmmRexrReg(m), &xf, 4); break; default: unreachable; } } static void OpRsqrtps(struct Machine *m) { unsigned i; float_v x; if (!m->xedd->op.ild_f3) { memcpy(&x, GetModrmRegisterXmmPointerRead16(m), 16); for (i = 0; i < 4; ++i) x[i] = 1.f / sqrtf(x[i]); memcpy(XmmRexrReg(m), &x, 16); } else { memcpy(&x, GetModrmRegisterXmmPointerRead4(m), 4); x[0] = 1.f / sqrtf(x[0]); memcpy(XmmRexrReg(m), &x, 4); } } static void OpRcpps(struct Machine *m) { int i; float_v x; if (!m->xedd->op.ild_f3) { memcpy(&x, GetModrmRegisterXmmPointerRead16(m), 16); for (i = 0; i < 4; ++i) x[i] = 1.f / x[i]; memcpy(XmmRexrReg(m), &x, 16); } else { memcpy(&x, GetModrmRegisterXmmPointerRead4(m), 4); x[0] = 1.f / x[0]; memcpy(XmmRexrReg(m), &x, 4); } } static void OpVpsdWpsd(struct Machine *m, float_v opf(struct Machine *, float_v, float_v), double_v opd(struct Machine *, double_v, double_v), bool isfloat, bool isdouble) { float_v xf, yf; double_v xd, yd; if (isfloat) { memcpy(&xf, XmmRexrReg(m), 16); memcpy(&yf, GetModrmRegisterXmmPointerRead16(m), 16); xf = opf(m, xf, yf); memcpy(XmmRexrReg(m), &xf, 16); } else if (isdouble) { memcpy(&xd, XmmRexrReg(m), 16); memcpy(&yd, GetModrmRegisterXmmPointerRead16(m), 16); xd = opd(m, xd, yd); memcpy(XmmRexrReg(m), &xd, 16); } else { OpUd(m); } } static void OpVpsdWpsd66(struct Machine *m, float_v opf(struct Machine *, float_v, float_v), double_v opd(struct Machine *, double_v, double_v)) { OpVpsdWpsd(m, opf, opd, !Prefix66(m->xedd), Prefix66(m->xedd)); } static void OpVpsdWpsd66f2(struct Machine *m, float_v opf(struct Machine *, float_v, float_v), double_v opd(struct Machine *, double_v, double_v)) { OpVpsdWpsd(m, opf, opd, m->xedd->op.ild_f2, Prefix66(m->xedd)); } static void OpVspsdWspsd(struct Machine *m, float_v opf(struct Machine *, float_v, float_v), double_v opd(struct Machine *, double_v, double_v)) { float_v xf, yf; double_v xd, yd; switch (m->xedd->op.rep | Prefix66(m->xedd)) { case 0: memcpy(&yf, GetModrmRegisterXmmPointerRead16(m), 16); memcpy(&xf, XmmRexrReg(m), 16); xf = opf(m, xf, yf); memcpy(XmmRexrReg(m), &xf, 16); break; case 1: memcpy(&yd, GetModrmRegisterXmmPointerRead16(m), 16); memcpy(&xd, XmmRexrReg(m), 16); xd = opd(m, xd, yd); memcpy(XmmRexrReg(m), &xd, 16); break; case 2: memcpy(&yd, GetModrmRegisterXmmPointerRead8(m), 8); memcpy(&xd, XmmRexrReg(m), 8); xd = opd(m, xd, yd); memcpy(XmmRexrReg(m), &xd, 8); break; case 3: memcpy(&yf, GetModrmRegisterXmmPointerRead4(m), 4); memcpy(&xf, XmmRexrReg(m), 4); xf = opf(m, xf, yf); memcpy(XmmRexrReg(m), &xf, 4); break; default: unreachable; } } static void OpComissVsWs(struct Machine *m) { float xf, yf; double xd, yd; uint8_t zf, cf, pf, ie; if (!Prefix66(m->xedd)) { memcpy(&xf, XmmRexrReg(m), 4); memcpy(&yf, GetModrmRegisterXmmPointerRead4(m), 4); if (!isnan(xf) && !isnan(yf)) { zf = xf == yf; cf = xf < yf; pf = false; ie = false; } else { zf = cf = pf = ie = true; } } else { memcpy(&xd, XmmRexrReg(m), 8); memcpy(&yd, GetModrmRegisterXmmPointerRead8(m), 8); if (!isnan(xd) && !isnan(yd)) { zf = xd == yd; cf = xd < yd; pf = false; ie = false; } else { zf = cf = pf = ie = true; } } m->flags = SetFlag(m->flags, FLAGS_ZF, zf); m->flags = SetFlag(m->flags, FLAGS_PF, pf); m->flags = SetFlag(m->flags, FLAGS_CF, cf); m->flags = SetFlag(m->flags, FLAGS_SF, false); m->flags = SetFlag(m->flags, FLAGS_OF, false); if ((m->xedd->op.opcode & 1) && (m->sse.ie = ie) && !m->sse.im) { HaltMachine(m, kMachineSimdException); } } static float_v OpAddps(struct Machine *m, float_v x, float_v y) { return x + y; } static double_v OpAddpd(struct Machine *m, double_v x, double_v y) { return x + y; } static float_v OpMulps(struct Machine *m, float_v x, float_v y) { return x * y; } static double_v OpMulpd(struct Machine *m, double_v x, double_v y) { return x * y; } static float_v OpSubps(struct Machine *m, float_v x, float_v y) { return x - y; } static double_v OpSubpd(struct Machine *m, double_v x, double_v y) { return x - y; } static float_v OpDivps(struct Machine *m, float_v x, float_v y) { return x / y; } static double_v OpDivpd(struct Machine *m, double_v x, double_v y) { return x / y; } static float_v OpAndps(struct Machine *m, float_v x, float_v y) { return (float_v)((int_v)x & (int_v)y); } static double_v OpAndpd(struct Machine *m, double_v x, double_v y) { return (double_v)((long_v)x & (long_v)y); } static float_v OpAndnps(struct Machine *m, float_v x, float_v y) { return (float_v)(~(int_v)x & (int_v)y); } static double_v OpAndnpd(struct Machine *m, double_v x, double_v y) { return (double_v)(~(long_v)x & (long_v)y); } static float_v OpOrps(struct Machine *m, float_v x, float_v y) { return (float_v)((int_v)x | (int_v)y); } static double_v OpOrpd(struct Machine *m, double_v x, double_v y) { return (double_v)((long_v)x | (long_v)y); } static float_v OpXorps(struct Machine *m, float_v x, float_v y) { return (float_v)((int_v)x ^ (int_v)y); } static double_v OpXorpd(struct Machine *m, double_v x, double_v y) { return (double_v)((long_v)x ^ (long_v)y); } static double_v OpHaddpd(struct Machine *m, double_v x, double_v y) { return (double_v){x[0] + x[1], y[0] + y[1]}; } static float_v OpHaddps(struct Machine *m, float_v x, float_v y) { return (float_v){x[0] + x[1], x[2] + x[3], y[0] + y[1], y[2] + y[3]}; } static double_v OpHsubpd(struct Machine *m, double_v x, double_v y) { return (double_v){x[0] - x[1], y[0] - y[1]}; } static float_v OpHsubps(struct Machine *m, float_v x, float_v y) { return (float_v){x[0] - x[1], x[2] - x[3], y[0] - y[1], y[2] - y[3]}; } static double_v OpAddsubpd(struct Machine *m, double_v x, double_v y) { return (double_v){x[0] - y[0], x[1] + y[1]}; } static float_v OpAddsubps(struct Machine *m, float_v x, float_v y) { return (float_v){x[0] - y[0], x[1] + y[1], x[2] - y[2], x[3] + y[3]}; } static float_v OpMinps(struct Machine *m, float_v x, float_v y) { int i; for (i = 0; i < 4; ++i) { x[i] = MIN(x[i], y[i]); } return x; } static double_v OpMinpd(struct Machine *m, double_v x, double_v y) { int i; for (i = 0; i < 4; ++i) { x[i] = MIN(x[i], y[i]); } return x; } static float_v OpMaxps(struct Machine *m, float_v x, float_v y) { int i; for (i = 0; i < 4; ++i) { x[i] = MAX(x[i], y[i]); } return x; } static double_v OpMaxpd(struct Machine *m, double_v x, double_v y) { int i; for (i = 0; i < 4; ++i) { x[i] = MAX(x[i], y[i]); } return x; } static float_v OpCmpps(struct Machine *m, float_v x, float_v y) { long i; switch (m->xedd->op.uimm0) { case 0: return x == y; case 1: return x < y; case 2: return x <= y; case 3: for (i = 0; i < 4; ++i) { x[i] = isnan(x[i]) || isnan(y[i]); } return x; case 4: return x != y; case 5: return x >= y; case 6: return x > y; case 7: for (i = 0; i < 4; ++i) { x[i] = !(isnan(x[i]) || isnan(y[i])); } return x; default: OpUd(m); } } static double_v OpCmppd(struct Machine *m, double_v x, double_v y) { long i; switch (m->xedd->op.uimm0) { case 0: return x == y; case 1: return x < y; case 2: return x <= y; case 3: for (i = 0; i < 2; ++i) { x[i] = isnan(x[i]) || isnan(y[i]); } return x; case 4: return x != y; case 5: return x >= y; case 6: return x > y; case 7: for (i = 0; i < 2; ++i) { x[i] = !(isnan(x[i]) || isnan(y[i])); } return x; default: OpUd(m); } } static void OpAddpsd(struct Machine *m) { OpVspsdWspsd(m, OpAddps, OpAddpd); } static void OpMulpsd(struct Machine *m) { OpVspsdWspsd(m, OpMulps, OpMulpd); } static void OpSubpsd(struct Machine *m) { OpVspsdWspsd(m, OpSubps, OpSubpd); } static void OpDivpsd(struct Machine *m) { OpVspsdWspsd(m, OpDivps, OpDivpd); } static void OpMinpsd(struct Machine *m) { OpVspsdWspsd(m, OpMinps, OpMinpd); } static void OpMaxpsd(struct Machine *m) { OpVspsdWspsd(m, OpMaxps, OpMaxpd); } static void OpCmppsd(struct Machine *m) { OpVspsdWspsd(m, OpCmpps, OpCmppd); } static void OpAndpsd(struct Machine *m) { OpVpsdWpsd66(m, OpAndps, OpAndpd); } static void OpAndnpsd(struct Machine *m) { OpVpsdWpsd66(m, OpAndnps, OpAndnpd); } static void OpOrpsd(struct Machine *m) { OpVpsdWpsd66(m, OpOrps, OpOrpd); } static void OpXorpsd(struct Machine *m) { OpVpsdWpsd66(m, OpXorps, OpXorpd); } static void OpHaddpsd(struct Machine *m) { OpVpsdWpsd66f2(m, OpHaddps, OpHaddpd); } static void OpHsubpsd(struct Machine *m) { OpVpsdWpsd66f2(m, OpHsubps, OpHsubpd); } static void OpAddsubpsd(struct Machine *m) { OpVpsdWpsd66f2(m, OpAddsubps, OpAddsubpd); } static void OpAluw(struct Machine *m, int64_t f(int, int, uint64_t, uint64_t, uint32_t *), int h) { int64_t v; void *p[2]; uint64_t x, y, z; uint8_t w, *a, *b, *c, split[8]; w = RegLog2(m->xedd); if (ModrmMod(m->xedd) != 0b11) { v = ComputeAddress(m); if (h & ALU_FLIP) { a = Load(m, v, 1 << w, split); } else { a = BeginLoadStore(m, v, 1 << w, p, split); } } else { v = 0; a = RegRexbRm(m); } b = RegRexrReg(m); if (h & ALU_FLIP) { c = b; b = a; a = c; } y = Read64(b); x = Read64(a); z = f(w, h, x, y, &m->flags); switch (w) { case 0: Write8(a, z); break; case 1: Write16(a, z); break; case 2: case 3: Write64(a, z); break; default: unreachable; } EndStore(m, v, 1 << w, p, split); if (h & ALU_XCHG) { switch (w) { case 0: Write8(b, x); break; case 1: Write16(b, x); break; case 2: case 3: Write64(b, x); break; default: unreachable; } } } static void OpAlub(struct Machine *m, int64_t f(int, int, uint64_t, uint64_t, uint32_t *), int h) { int64_t v; uint64_t x, y, z; uint8_t *a, *b, *c; if (!m->xedd->op.has_modrm || IsModrmRegister(m->xedd)) { a = ByteRexbRm(m); } else { v = ComputeAddress(m); a = ResolveAddress(m, v); if (h & ALU_FLIP) { SetReadAddr(m, v, 1); } else { SetWriteAddr(m, v, 1); } } b = ByteRexrReg(m); if (h & ALU_FLIP) { c = b; b = a; a = c; } y = Read8(b); x = Read8(a); z = f(0, h, x, y, &m->flags); Write8(a, z); if (h & ALU_XCHG) Write8(b, x); } static void OpAluwi(struct Machine *m, int64_t f(int, int, uint64_t, uint64_t, uint32_t *), int h, uint64_t yimm) { int64_t v; void *p[2]; uint64_t x, y, z; uint8_t w, *a, *c, split[8]; w = RegLog2(m->xedd); if (m->xedd->op.has_modrm && ModrmMod(m->xedd) != 0b11) { v = ComputeAddress(m); a = BeginLoadStore(m, v, 1 << w, p, split); } else { v = 0; a = RegRexbRm(m); } y = yimm; x = Read64(a); z = f(w, h, x, y, &m->flags); switch (w) { case 0: Write8(a, z); break; case 1: Write16(a, z); break; case 2: case 3: Write64(a, z); break; default: unreachable; } EndStore(m, v, 1 << w, p, split); } static void OpAlubi(struct Machine *m, int64_t f(int, int, uint64_t, uint64_t, uint32_t *), int h, uint64_t yimm) { int64_t v; uint64_t x, y, z; uint8_t *a, *b, *c; if (!m->xedd->op.has_modrm || IsModrmRegister(m->xedd)) { a = ByteRexbRm(m); } else { v = ComputeAddress(m); a = ResolveAddress(m, v); SetWriteAddr(m, v, 1); } y = yimm; b = NULL; x = Read8(a); z = f(0, h, x, y, &m->flags); Write8(a, z); } static void ExecuteInstructionMap0(struct Machine *m) { switch (m->xedd->op.opcode) { CASE(/*0120 0x50*/ 0b01010000 ... 0x57, OpPushZvq(m)); CASE(/*0130 0x58*/ 0b01011000 ... 0x5f, OpPopZvq(m)); CASE(/*0143 0x63*/ 0b01100011, OpMovsxdGdqpEd(m)); CASE(/*0150 0x68*/ 0b01101000, PushOsz(m, m->xedd->op.uimm0)); CASE(/*0151 0x69*/ 0b01101001, OpImulGvqpEvqpImm(m)); CASE(/*0152 0x6A*/ 0b01101010, PushOsz(m, m->xedd->op.uimm0)); CASE(/*0153 0x6B*/ 0b01101011, OpImulGvqpEvqpImm(m)); CASE(/*0154 0x6C*/ 0b01101100, OpString(m, STRING_INS)); CASE(/*0155 0x6D*/ 0b01101101, OpString(m, STRING_INS)); CASE(/*0156 0x6E*/ 0b01101110, OpString(m, STRING_OUTS)); CASE(/*0157 0x6F*/ 0b01101111, OpString(m, STRING_OUTS)); CASE(/*0160 0x70*/ 0b01110000, if (GetCond(m, 0x0)) OpJmp(m)); CASE(/*0161 0x71*/ 0b01110001, if (GetCond(m, 0x1)) OpJmp(m)); CASE(/*0162 0x72*/ 0b01110010, if (GetCond(m, 0x2)) OpJmp(m)); CASE(/*0163 0x73*/ 0b01110011, if (GetCond(m, 0x3)) OpJmp(m)); CASE(/*0164 0x74*/ 0b01110100, if (GetCond(m, 0x4)) OpJmp(m)); CASE(/*0165 0x75*/ 0b01110101, if (GetCond(m, 0x5)) OpJmp(m)); CASE(/*0166 0x76*/ 0b01110110, if (GetCond(m, 0x6)) OpJmp(m)); CASE(/*0167 0x77*/ 0b01110111, if (GetCond(m, 0x7)) OpJmp(m)); CASE(/*0170 0x78*/ 0b01111000, if (GetCond(m, 0x8)) OpJmp(m)); CASE(/*0171 0x79*/ 0b01111001, if (GetCond(m, 0x9)) OpJmp(m)); CASE(/*0172 0x7A*/ 0b01111010, if (GetCond(m, 0xa)) OpJmp(m)); CASE(/*0173 0x7B*/ 0b01111011, if (GetCond(m, 0xb)) OpJmp(m)); CASE(/*0174 0x7C*/ 0b01111100, if (GetCond(m, 0xc)) OpJmp(m)); CASE(/*0175 0x7D*/ 0b01111101, if (GetCond(m, 0xd)) OpJmp(m)); CASE(/*0176 0x7E*/ 0b01111110, if (GetCond(m, 0xe)) OpJmp(m)); CASE(/*0177 0x7F*/ 0b01111111, if (GetCond(m, 0xf)) OpJmp(m)); CASE(/*0200 0x80*/ 0b10000000, OpAlubi(m, Alu, ModrmReg(m->xedd), UIMM0)); CASE(/*0201 0x81*/ 0b10000001, OpAluwi(m, Alu, ModrmReg(m->xedd), UIMM0)); CASE(/*0202 0x82*/ 0b10000010, OpAlubi(m, Alu, ModrmReg(m->xedd), UIMM0)); CASE(/*0203 0x83*/ 0b10000011, OpAluwi(m, Alu, ModrmReg(m->xedd), UIMM0)); CASE(/*0204 0x84*/ 0b10000100, OpAlub(m, Alu, ALU_TEST | ALU_AND)); CASE(/*0205 0x85*/ 0b10000101, OpAluw(m, Alu, ALU_TEST | ALU_AND)); CASE(/*0206 0x86*/ 0b10000110, OpXchgGbEb(m)); CASE(/*0207 0x87*/ 0b10000111, OpXchgGvqpEvqp(m)); CASE(/*0210 0x88*/ 0b10001000, OpMovEbGb(m)); CASE(/*0211 0x89*/ 0b10001001, OpMovEvqpGvqp(m)); CASE(/*0212 0x8A*/ 0b10001010, OpMovGbEb(m)); CASE(/*0213 0x8B*/ 0b10001011, OpMovGvqpEvqp(m)); CASE(/*0214 0x8C*/ 0b10001100, OpMovEvqpSw(m)); CASE(/*0215 0x8D*/ 0b10001101, OpLeaGvqpM(m)); CASE(/*0216 0x8E*/ 0b10001110, OpMovSwEvqp(m)); CASE(/*0217 0x8F*/ 0b10001111, OpPopEvq(m)); CASE(/*0220 0x90*/ 0b10010000, OpNop(m)); CASE(/*0221 0x91*/ 0b10010001 ... 0x97, OpXchgZvqp(m)); CASE(/*0230 0x98*/ 0b10011000, OpConvert1(m)); CASE(/*0231 0x99*/ 0b10011001, OpConvert2(m)); CASE(/*0234 0x9C*/ 0b10011100, OpPushf(m)); CASE(/*0235 0x9D*/ 0b10011101, OpPopf(m)); CASE(/*0236 0x9E*/ 0b10011110, OpSahf(m)); CASE(/*0237 0x9F*/ 0b10011111, OpLahf(m)); CASE(/*0233 0x9b*/ 0b10011011, OpFwait(m)); CASE(/*0240 0xA0*/ 0b10100000, OpMovAlOb(m)); CASE(/*0241 0xA1*/ 0b10100001, OpMovRaxOvqp(m)); CASE(/*0242 0xA2*/ 0b10100010, OpMovObAl(m)); CASE(/*0243 0xA3*/ 0b10100011, OpMovOvqpRax(m)); CASE(/*0244 0xA4*/ 0b10100100, OpMovsb(m)); CASE(/*0245 0xA5*/ 0b10100101, OpString(m, STRING_MOVS)); CASE(/*0246 0xA6*/ 0b10100110, OpString(m, STRING_CMPS)); CASE(/*0247 0xA7*/ 0b10100111, OpString(m, STRING_CMPS)); CASE(/*0250 0xA8*/ 0b10101000, OpAlubi(m, Alu, ALU_TEST | ALU_AND, UIMM0)); CASE(/*0251 0xA9*/ 0b10101001, OpAluwi(m, Alu, ALU_TEST | ALU_AND, UIMM0)); CASE(/*0252 0xAA*/ 0b10101010, OpStosb(m)); CASE(/*0253 0xAB*/ 0b10101011, OpString(m, STRING_STOS)); CASE(/*0254 0xAC*/ 0b10101100, OpString(m, STRING_LODS)); CASE(/*0255 0xAD*/ 0b10101101, OpString(m, STRING_LODS)); CASE(/*0256 0xAE*/ 0b10101110, OpString(m, STRING_SCAS)); CASE(/*0257 0xAF*/ 0b10101111, OpString(m, STRING_SCAS)); CASE(/*0260 0xB0*/ 0b10110000 ... 0b10110111, OpMovZbIb(m)); CASE(/*0270 0xB8*/ 0b10111000 ... 0b10111111, OpMovZvqpIvqp(m)); CASE(/*0300 0xC0*/ 0b11000000, OpAlubi(m, Bsu, ModrmReg(m->xedd), UIMM0)); CASE(/*0301 0xC1*/ 0b11000001, OpAluwi(m, Bsu, ModrmReg(m->xedd), UIMM0)); CASE(/*0302 0xC2*/ 0b11000010, OpRet(m, m->xedd->op.uimm0)); CASE(/*0303 0xC3*/ 0b11000011, OpRet(m, 0)); CASE(/*0306 0xC6*/ 0b11000110, OpMovEbIb(m)); CASE(/*0307 0xC7*/ 0b11000111, OpMovEvqpIvds(m)); CASE(/*0311 0xC9*/ 0b11001001, OpLeave(m)); CASE(/*0314 0xCC*/ 0b11001100, OpInterrupt(m, 3)); CASE(/*0315 0xCD*/ 0b11001101, OpInterrupt(m, m->xedd->op.uimm0)); CASE(/*0320 0xD0*/ 0b11010000, OpAlubi(m, Bsu, ModrmReg(m->xedd), 1)); CASE(/*0321 0xD1*/ 0b11010001, OpAluwi(m, Bsu, ModrmReg(m->xedd), 1)); CASE(/*0322 0xD2*/ 0b11010010, OpAlubi(m, Bsu, REG, m->cx[0])); CASE(/*0323 0xD3*/ 0b11010011, OpAluwi(m, Bsu, REG, m->cx[0])); CASE(/*0327 0xD7*/ 0b11010111, OpXlat(m)); CASE(/*0340 0xE0*/ 0b11100000, OpLoop(m, !GetFlag(m->flags, FLAGS_ZF))); CASE(/*0341 0xE1*/ 0b11100001, OpLoop(m, GetFlag(m->flags, FLAGS_ZF))); CASE(/*0342 0xE2*/ 0b11100010, OpLoop(m, 1)); CASE(/*0343 0xE3*/ 0b11100011, OpJcxz(m)); CASE(/*0344 0xE4*/ 0b11100100, Write8(m->ax, OpIn(m, UIMM0))); CASE(/*0345 0xE5*/ 0b11100101, Write32(m->ax, OpIn(m, UIMM0))); CASE(/*0346 0xE6*/ 0b11100110, OpOut(m, UIMM0, Read8(m->ax))); CASE(/*0347 0xE7*/ 0b11100111, OpOut(m, UIMM0, Read32(m->ax))); CASE(/*0350 0xE8*/ 0b11101000, OpCallJvds(m)); CASE(/*0351 0xE9*/ 0b11101001, OpJmp(m)); CASE(/*0353 0xEB*/ 0b11101011, OpJmp(m)); CASE(/*0354 0xEC*/ 0b11101100, Write8(m->ax, OpIn(m, Read16(m->dx)))); CASE(/*0355 0xED*/ 0b11101101, Write32(m->ax, OpIn(m, Read16(m->dx)))); CASE(/*0356 0xEE*/ 0b11101110, OpOut(m, Read16(m->dx), Read8(m->ax))); CASE(/*0357 0xEF*/ 0b11101111, OpOut(m, Read16(m->dx), Read32(m->ax))); CASE(/*0361 0xF1*/ 0b11110001, OpInterrupt(m, 1)); CASE(/*0364 0xF4*/ 0b11110100, OpHlt(m)); CASE(/*0365 0xF5*/ 0b11110101, OpCmc(m)); CASE(/*0370 0xF8*/ 0b11111000, OpClc(m)); CASE(/*0371 0xF9*/ 0b11111001, OpStc(m)); CASE(/*0372 0xFA*/ 0b11111010, OpCli(m)); CASE(/*0373 0xFB*/ 0b11111011, OpSti(m)); CASE(/*0374 0xFC*/ 0b11111100, OpCld(m)); CASE(/*0375 0xFD*/ 0b11111101, OpStd(m)); case /*0004 0x04*/ 0b00000100: case /*0014 0x0C*/ 0b00001100: case /*0024 0x14*/ 0b00010100: case /*0034 0x1C*/ 0b00011100: case /*0044 0x24*/ 0b00100100: case /*0054 0x2C*/ 0b00101100: case /*0064 0x34*/ 0b00110100: case /*0074 0x3C*/ 0b00111100: OpAlubi(m, Alu, (m->xedd->op.opcode & 070) >> 3, m->xedd->op.uimm0); break; case /*0005 0x05*/ 0b00000101: case /*0015 0x0D*/ 0b00001101: case /*0025 0x15*/ 0b00010101: case /*0035 0x1D*/ 0b00011101: case /*0045 0x25*/ 0b00100101: case /*0055 0x2D*/ 0b00101101: case /*0065 0x35*/ 0b00110101: case /*0075 0x3D*/ 0b00111101: OpAluwi(m, Alu, (m->xedd->op.opcode & 070) >> 3, m->xedd->op.uimm0); break; case /*0000 0x00*/ 0b00000000: case /*0002 0x02*/ 0b00000010: case /*0010 0x08*/ 0b00001000: case /*0012 0x0A*/ 0b00001010: case /*0020 0x10*/ 0b00010000: case /*0022 0x12*/ 0b00010010: case /*0030 0x18*/ 0b00011000: case /*0032 0x1A*/ 0b00011010: case /*0040 0x20*/ 0b00100000: case /*0042 0x22*/ 0b00100010: case /*0050 0x28*/ 0b00101000: case /*0052 0x2A*/ 0b00101010: case /*0060 0x30*/ 0b00110000: case /*0062 0x32*/ 0b00110010: case /*0070 0x38*/ 0b00111000: case /*0072 0x3A*/ 0b00111010: OpAlub(m, Alu, ((m->xedd->op.opcode & 070) >> 3 | (m->xedd->op.opcode & 0b010 ? ALU_FLIP : 0))); break; case /*0001 0x01*/ 0b00000001: case /*0003 0x03*/ 0b00000011: case /*0011 0x09*/ 0b00001001: case /*0013 0x0B*/ 0b00001011: case /*0021 0x11*/ 0b00010001: case /*0023 0x13*/ 0b00010011: case /*0031 0x19*/ 0b00011001: case /*0033 0x1B*/ 0b00011011: case /*0041 0x21*/ 0b00100001: case /*0043 0x23*/ 0b00100011: case /*0051 0x29*/ 0b00101001: case /*0053 0x2B*/ 0b00101011: case /*0061 0x31*/ 0b00110001: case /*0063 0x33*/ 0b00110011: case /*0071 0x39*/ 0b00111001: case /*0073 0x3B*/ 0b00111011: OpAluw(m, Alu, ((m->xedd->op.opcode & 070) >> 3 | (m->xedd->op.opcode & 0b010 ? ALU_FLIP : 0))); break; case /*0330 0xD8*/ 0b11011000: case /*0331 0xD9*/ 0b11011001: case /*0332 0xDA*/ 0b11011010: case /*0333 0xDB*/ 0b11011011: case /*0334 0xDC*/ 0b11011100: case /*0335 0xDD*/ 0b11011101: case /*0336 0xDE*/ 0b11011110: case /*0337 0xDF*/ 0b11011111: OpFpu(m); break; case /*0366 0xF6*/ 0b11110110: switch (ModrmReg(m->xedd)) { CASE(0, OpAlubi(m, Alu, ALU_TEST | ALU_AND, UIMM0)); CASE(1, OpAlubi(m, Alu, ALU_TEST | ALU_AND, UIMM0)); CASE(2, OpEb(m, AluNot)); CASE(3, OpEb(m, AluNeg)); CASE(4, OpMulAxAlEbUnsigned(m)); CASE(5, OpMulAxAlEbSigned(m)); CASE(6, OpDivAlAhAxEbUnsigned(m)); CASE(7, OpDivAlAhAxEbSigned(m)); default: unreachable; } break; case /*0367 0xF7*/ 0b11110111: switch (ModrmReg(m->xedd)) { CASE(0, OpAluwi(m, Alu, ALU_TEST | ALU_AND, UIMM0)); CASE(1, OpAluwi(m, Alu, ALU_TEST | ALU_AND, UIMM0)); CASE(2, OpEvqp(m, AluNot)); CASE(3, OpEvqp(m, AluNeg)); CASE(4, OpMulRdxRaxEvqpUnsigned(m)); CASE(5, OpMulRdxRaxEvqpSigned(m)); CASE(6, OpDivRdxRaxEvqpUnsigned(m)); CASE(7, OpDivRdxRaxEvqpSigned(m)); default: unreachable; } break; case /*0376 0xFE*/ 0b11111110: switch (ModrmReg(m->xedd)) { CASE(0b000, OpEb(m, AluInc)); CASE(0b001, OpEb(m, AluDec)); default: OpUd(m); } break; case /*0377 0xFF*/ 0b11111111: switch (ModrmReg(m->xedd)) { CASE(0, OpEvqp(m, AluInc)); CASE(1, OpEvqp(m, AluDec)); CASE(2, OpCallEq(m)); CASE(4, OpJmpEq(m)); CASE(6, OpPushEvq(m)); default: OpUd(m); } break; default: OpUd(m); } } static void ExecuteInstructionMap1(struct Machine *m) { switch (m->xedd->op.opcode) { CASE(/*0005 0x05*/ 0b00000101, OpSyscall(m)); CASE(/*0020 0x10*/ 0b00010000, OpMov0f10(m)); CASE(/*0021 0x11*/ 0b00010001, OpMovWpsVps(m)); CASE(/*0022 0x12*/ 0b00010010, OpMov0f12(m)); CASE(/*0023 0x13*/ 0b00010011, OpMov0f13(m)); CASE(/*0024 0x14*/ 0b00010100, OpUnpcklpsd(m)); CASE(/*0025 0x15*/ 0b00010101, OpUnpckhpsd(m)); CASE(/*0026 0x16*/ 0b00010110, OpMov0f16(m)); CASE(/*0027 0x17*/ 0b00010111, OpMov0f17(m)); CASE(/*0050 0x28*/ 0b00101000, OpMov0f28(m)); CASE(/*0051 0x29*/ 0b00101001, OpMovWpsVps(m)); CASE(/*0052 0x2A*/ 0b00101010, OpCvt(m, kOpCvt0f2a)); CASE(/*0053 0x2B*/ 0b00101011, OpMov0f2b(m)); CASE(/*0054 0x2C*/ 0b00101100, OpCvt(m, kOpCvtt0f2c)); CASE(/*0055 0x2D*/ 0b00101101, OpCvt(m, kOpCvt0f2d)); CASE(/*0056 0x2E*/ 0b00101110, OpComissVsWs(m)); CASE(/*0057 0x2F*/ 0b00101111, OpComissVsWs(m)); CASE(/*0061 0x31*/ 0b00110001, OpRdtsc(m)); CASE(/*0100 0x40*/ 0b01000000, if (GetCond(m, 0x0)) OpMovGvqpEvqp(m)); CASE(/*0101 0x41*/ 0b01000001, if (GetCond(m, 0x1)) OpMovGvqpEvqp(m)); CASE(/*0102 0x42*/ 0b01000010, if (GetCond(m, 0x2)) OpMovGvqpEvqp(m)); CASE(/*0103 0x43*/ 0b01000011, if (GetCond(m, 0x3)) OpMovGvqpEvqp(m)); CASE(/*0104 0x44*/ 0b01000100, if (GetCond(m, 0x4)) OpMovGvqpEvqp(m)); CASE(/*0105 0x45*/ 0b01000101, if (GetCond(m, 0x5)) OpMovGvqpEvqp(m)); CASE(/*0106 0x46*/ 0b01000110, if (GetCond(m, 0x6)) OpMovGvqpEvqp(m)); CASE(/*0107 0x47*/ 0b01000111, if (GetCond(m, 0x7)) OpMovGvqpEvqp(m)); CASE(/*0110 0x48*/ 0b01001000, if (GetCond(m, 0x8)) OpMovGvqpEvqp(m)); CASE(/*0111 0x49*/ 0b01001001, if (GetCond(m, 0x9)) OpMovGvqpEvqp(m)); CASE(/*0112 0x4a*/ 0b01001010, if (GetCond(m, 0xa)) OpMovGvqpEvqp(m)); CASE(/*0113 0x4b*/ 0b01001011, if (GetCond(m, 0xb)) OpMovGvqpEvqp(m)); CASE(/*0114 0x4c*/ 0b01001100, if (GetCond(m, 0xc)) OpMovGvqpEvqp(m)); CASE(/*0115 0x4d*/ 0b01001101, if (GetCond(m, 0xd)) OpMovGvqpEvqp(m)); CASE(/*0116 0x4e*/ 0b01001110, if (GetCond(m, 0xe)) OpMovGvqpEvqp(m)); CASE(/*0117 0x4f*/ 0b01001111, if (GetCond(m, 0xf)) OpMovGvqpEvqp(m)); CASE(/*0121 0x51*/ 0b01010001, OpSqrtpsd(m)); CASE(/*0122 0x52*/ 0b01010010, OpRsqrtps(m)); CASE(/*0123 0x53*/ 0b01010011, OpRcpps(m)); CASE(/*0124 0x54*/ 0b01010100, OpAndpsd(m)); CASE(/*0125 0x55*/ 0b01010101, OpAndnpsd(m)); CASE(/*0126 0x56*/ 0b01010110, OpOrpsd(m)); CASE(/*0127 0x57*/ 0b01010111, OpXorpsd(m)); CASE(/*0130 0x58*/ 0b01011000, OpAddpsd(m)); CASE(/*0131 0x59*/ 0b01011001, OpMulpsd(m)); CASE(/*0132 0x5A*/ 0b01011010, OpCvt(m, kOpCvt0f5a)); CASE(/*0133 0x5B*/ 0b01011011, OpCvt(m, kOpCvt0f5b)); CASE(/*0134 0x5C*/ 0b01011100, OpSubpsd(m)); CASE(/*0135 0x5D*/ 0b01011101, OpMinpsd(m)); CASE(/*0136 0x5E*/ 0b01011110, OpDivpsd(m)); CASE(/*0137 0x5F*/ 0b01011111, OpMaxpsd(m)); CASE(/*0140 0x60*/ 0b01100000, OpSse(m, kOpSsePunpcklbw)); CASE(/*0141 0x61*/ 0b01100001, OpSse(m, kOpSsePunpcklwd)); CASE(/*0142 0x62*/ 0b01100010, OpSse(m, kOpSsePunpckldq)); CASE(/*0143 0x63*/ 0b01100011, OpSse(m, kOpSsePacksswb)); CASE(/*0144 0x64*/ 0b01100100, OpSse(m, kOpSsePcmpgtb)); CASE(/*0145 0x65*/ 0b01100101, OpSse(m, kOpSsePcmpgtw)); CASE(/*0146 0x66*/ 0b01100110, OpSse(m, kOpSsePcmpgtd)); CASE(/*0147 0x67*/ 0b01100111, OpSse(m, kOpSsePackuswb)); CASE(/*0150 0x68*/ 0b01101000, OpSse(m, kOpSsePunpckhbw)); CASE(/*0151 0x69*/ 0b01101001, OpSse(m, kOpSsePunpckhwd)); CASE(/*0152 0x6A*/ 0b01101010, OpSse(m, kOpSsePunpckhdq)); CASE(/*0153 0x6B*/ 0b01101011, OpSse(m, kOpSsePackssdw)); CASE(/*0154 0x6C*/ 0b01101100, OpSse(m, kOpSsePunpcklqdq)); CASE(/*0155 0x6D*/ 0b01101101, OpSse(m, kOpSsePunpckhqdq)); CASE(/*0156 0x6E*/ 0b01101110, OpMov0f6e(m)); CASE(/*0157 0x6F*/ 0b01101111, OpMov0f6f(m)); CASE(/*0160 0x70*/ 0b01110000, OpShuffle(m)); CASE(/*0164 0x74*/ 0b01110100, OpSse(m, kOpSsePcmpeqb)); CASE(/*0165 0x75*/ 0b01110101, OpSse(m, kOpSsePcmpeqw)); CASE(/*0166 0x76*/ 0b01110110, OpSse(m, kOpSsePcmpeqd)); CASE(/*0174 0x7C*/ 0b01111100, OpHaddpsd(m)); CASE(/*0175 0x7D*/ 0b01111101, OpHsubpsd(m)); CASE(/*0176 0x7E*/ 0b01111110, OpMov0f7e(m)); CASE(/*0177 0x7F*/ 0b01111111, OpMov0f7f(m)); CASE(/*0200 0x80*/ 0b10000000, if (GetCond(m, 0x0)) OpJmp(m)); CASE(/*0201 0x81*/ 0b10000001, if (GetCond(m, 0x1)) OpJmp(m)); CASE(/*0202 0x82*/ 0b10000010, if (GetCond(m, 0x2)) OpJmp(m)); CASE(/*0203 0x83*/ 0b10000011, if (GetCond(m, 0x3)) OpJmp(m)); CASE(/*0204 0x84*/ 0b10000100, if (GetCond(m, 0x4)) OpJmp(m)); CASE(/*0205 0x85*/ 0b10000101, if (GetCond(m, 0x5)) OpJmp(m)); CASE(/*0206 0x86*/ 0b10000110, if (GetCond(m, 0x6)) OpJmp(m)); CASE(/*0207 0x87*/ 0b10000111, if (GetCond(m, 0x7)) OpJmp(m)); CASE(/*0210 0x88*/ 0b10001000, if (GetCond(m, 0x8)) OpJmp(m)); CASE(/*0211 0x89*/ 0b10001001, if (GetCond(m, 0x9)) OpJmp(m)); CASE(/*0212 0x8a*/ 0b10001010, if (GetCond(m, 0xa)) OpJmp(m)); CASE(/*0213 0x8b*/ 0b10001011, if (GetCond(m, 0xb)) OpJmp(m)); CASE(/*0214 0x8c*/ 0b10001100, if (GetCond(m, 0xc)) OpJmp(m)); CASE(/*0215 0x8d*/ 0b10001101, if (GetCond(m, 0xd)) OpJmp(m)); CASE(/*0216 0x8e*/ 0b10001110, if (GetCond(m, 0xe)) OpJmp(m)); CASE(/*0217 0x8f*/ 0b10001111, if (GetCond(m, 0xf)) OpJmp(m)); CASE(/*0220 0x90*/ 0b10010000, OpEbSetCc(m, GetCond(m, 0x0))); CASE(/*0221 0x91*/ 0b10010001, OpEbSetCc(m, GetCond(m, 0x1))); CASE(/*0222 0x92*/ 0b10010010, OpEbSetCc(m, GetCond(m, 0x2))); CASE(/*0223 0x93*/ 0b10010011, OpEbSetCc(m, GetCond(m, 0x3))); CASE(/*0224 0x94*/ 0b10010100, OpEbSetCc(m, GetCond(m, 0x4))); CASE(/*0225 0x95*/ 0b10010101, OpEbSetCc(m, GetCond(m, 0x5))); CASE(/*0226 0x96*/ 0b10010110, OpEbSetCc(m, GetCond(m, 0x6))); CASE(/*0227 0x97*/ 0b10010111, OpEbSetCc(m, GetCond(m, 0x7))); CASE(/*0230 0x98*/ 0b10011000, OpEbSetCc(m, GetCond(m, 0x8))); CASE(/*0231 0x99*/ 0b10011001, OpEbSetCc(m, GetCond(m, 0x9))); CASE(/*0232 0x9A*/ 0b10011010, OpEbSetCc(m, GetCond(m, 0xa))); CASE(/*0233 0x9B*/ 0b10011011, OpEbSetCc(m, GetCond(m, 0xb))); CASE(/*0234 0x9C*/ 0b10011100, OpEbSetCc(m, GetCond(m, 0xc))); CASE(/*0235 0x9D*/ 0b10011101, OpEbSetCc(m, GetCond(m, 0xd))); CASE(/*0236 0x9E*/ 0b10011110, OpEbSetCc(m, GetCond(m, 0xe))); CASE(/*0237 0x9F*/ 0b10011111, OpEbSetCc(m, GetCond(m, 0xf))); CASE(/*0240 0xA0*/ 0b10100000, OpPushFs(m)); CASE(/*0241 0xA1*/ 0b10100001, OpPopFs(m)); CASE(/*0242 0xA2*/ 0b10100010, OpCpuid(m)); CASE(/*0243 0xA3*/ 0b10100011, OpBit(m)); CASE(/*0250 0xA8*/ 0b10101000, OpPushGs(m)); CASE(/*0251 0xA9*/ 0b10101001, OpPopGs(m)); CASE(/*0253 0xAB*/ 0b10101011, OpBit(m)); CASE(/*0257 0xAF*/ 0b10101111, OpImulGvqpEvqp(m)); CASE(/*0260 0xB0*/ 0b10110000, OpCmpxchgEbAlGb(m)); CASE(/*0261 0xB1*/ 0b10110001, OpCmpxchgEvqpRaxGvqp(m)); CASE(/*0263 0xB3*/ 0b10110011, OpBit(m)); CASE(/*0266 0xB6*/ 0b10110110, OpMovzbGvqpEb(m)); CASE(/*0267 0xB7*/ 0b10110111, OpMovzwGvqpEw(m)); CASE(/*0272 0xBA*/ 0b10111010, OpBit(m)); CASE(/*0273 0xBB*/ 0b10111011, OpBit(m)); CASE(/*0274 0xBC*/ 0b10111100, OpGvqpEvqp(m, AluBsf, MUTATING)); CASE(/*0275 0xBD*/ 0b10111101, OpGvqpEvqp(m, AluBsr, MUTATING)); CASE(/*0276 0xBE*/ 0b10111110, OpMovsbGvqpEb(m)); CASE(/*0277 0xBF*/ 0b10111111, OpMovswGvqpEw(m)); CASE(/*0300 0xC0*/ 0b11000000, OpAlub(m, Alu, ALU_XCHG | ALU_ADD)); CASE(/*0301 0xC1*/ 0b11000001, OpAluw(m, Alu, ALU_XCHG | ALU_ADD)); CASE(/*0302 0xC2*/ 0b11000010, OpCmppsd(m)); CASE(/*0303 0xC3*/ 0b11000011, OpMovntiMdqpGdqp(m)); CASE(/*0304 0xC4*/ 0b11000100, OpPinsrwVdqEwIb(m)); CASE(/*0305 0xC5*/ 0b11000101, OpPextrwGdqpUdqIb(m)); CASE(/*0306 0xC6*/ 0b11000110, OpShufpsd(m)); CASE(/*0307 0xC7*/ 0b11000111, OpCmpxchgDxAx(m)); CASE(/*0310 0xC8*/ 0b11001000 ... 0b11001111, OpBswapZvqp(m)); CASE(/*0320 0xD0*/ 0b11010000, OpAddsubpsd(m)); CASE(/*0321 0xD1*/ 0b11010001, OpSse(m, kOpSsePsrlwv)); CASE(/*0322 0xD2*/ 0b11010010, OpSse(m, kOpSsePsrldv)); CASE(/*0323 0xD3*/ 0b11010011, OpSse(m, kOpSsePsrlqv)); CASE(/*0324 0xD4*/ 0b11010100, OpSse(m, kOpSsePaddq)); CASE(/*0325 0xD5*/ 0b11010101, OpSse(m, kOpSsePmullw)); CASE(/*0326 0xD6*/ 0b11010110, OpMov0fD6(m)); CASE(/*0327 0xD7*/ 0b11010111, OpPmovmskbGdqpNqUdq(m)); CASE(/*0330 0xD8*/ 0b11011000, OpSse(m, kOpSsePsubusb)); CASE(/*0331 0xD9*/ 0b11011001, OpSse(m, kOpSsePsubusw)); CASE(/*0332 0xDA*/ 0b11011010, OpSse(m, kOpSsePminub)); CASE(/*0333 0xDB*/ 0b11011011, OpSse(m, kOpSsePand)); CASE(/*0334 0xDC*/ 0b11011100, OpSse(m, kOpSsePaddusb)); CASE(/*0335 0xDD*/ 0b11011101, OpSse(m, kOpSsePaddusw)); CASE(/*0336 0xDE*/ 0b11011110, OpSse(m, kOpSsePmaxub)); CASE(/*0337 0xDF*/ 0b11011111, OpSse(m, kOpSsePandn)); CASE(/*0340 0xE0*/ 0b11100000, OpSse(m, kOpSsePavgb)); CASE(/*0341 0xE1*/ 0b11100001, OpSse(m, kOpSsePsrawv)); CASE(/*0342 0xE2*/ 0b11100010, OpSse(m, kOpSsePsradv)); CASE(/*0343 0xE3*/ 0b11100011, OpSse(m, kOpSsePavgw)); CASE(/*0344 0xE4*/ 0b11100100, OpSse(m, kOpSsePmulhuw)); CASE(/*0345 0xE5*/ 0b11100101, OpSse(m, kOpSsePmulhw)); CASE(/*0346 0xE6*/ 0b11100110, OpCvt(m, kOpCvt0fE6)); CASE(/*0347 0xE7*/ 0b11100111, OpMov0fE7(m)); CASE(/*0350 0xE8*/ 0b11101000, OpSse(m, kOpSsePsubsb)); CASE(/*0351 0xE9*/ 0b11101001, OpSse(m, kOpSsePsubsw)); CASE(/*0352 0xEA*/ 0b11101010, OpSse(m, kOpSsePminsw)); CASE(/*0353 0xEB*/ 0b11101011, OpSse(m, kOpSsePor)); CASE(/*0354 0xEC*/ 0b11101100, OpSse(m, kOpSsePaddsb)); CASE(/*0355 0xED*/ 0b11101101, OpSse(m, kOpSsePaddsw)); CASE(/*0356 0xEE*/ 0b11101110, OpSse(m, kOpSsePmaxsw)); CASE(/*0357 0xEF*/ 0b11101111, OpSse(m, kOpSsePxor)); CASE(/*0360 0xF0*/ 0b11110000, OpLddquVdqMdq(m)); CASE(/*0361 0xF1*/ 0b11110001, OpSse(m, kOpSsePsllwv)); CASE(/*0362 0xF2*/ 0b11110010, OpSse(m, kOpSsePslldv)); CASE(/*0363 0xF3*/ 0b11110011, OpSse(m, kOpSsePsllqv)); CASE(/*0364 0xF4*/ 0b11110100, OpSse(m, kOpSsePmuludq)); CASE(/*0365 0xF5*/ 0b11110101, OpSse(m, kOpSsePmaddwd)); CASE(/*0366 0xF6*/ 0b11110110, OpSse(m, kOpSsePsadbw)); CASE(/*0367 0xF7*/ 0b11110111, OpMaskMovDiXmmRegXmmRm(m)); CASE(/*0370 0xF8*/ 0b11111000, OpSse(m, kOpSsePsubb)); CASE(/*0371 0xF9*/ 0b11111001, OpSse(m, kOpSsePsubw)); CASE(/*0372 0xFA*/ 0b11111010, OpSse(m, kOpSsePsubd)); CASE(/*0373 0xFB*/ 0b11111011, OpSse(m, kOpSsePsubq)); CASE(/*0374 0xFC*/ 0b11111100, OpSse(m, kOpSsePaddb)); CASE(/*0375 0xFD*/ 0b11111101, OpSse(m, kOpSsePaddw)); CASE(/*0376 0xFE*/ 0b11111110, OpSse(m, kOpSsePaddd)); case /*0013 0x0B*/ 0b00001011: case /*0271 0xB9*/ 0b10111001: case /*0377 0xFF*/ 0b11111111: OpUd(m); break; case /*0015 0x0D*/ 0b00001101: case /*0030 0x18*/ 0b00011000: case /*0031 0x19*/ 0b00011001: case /*0032 0x1A*/ 0b00011010: case /*0033 0x1B*/ 0b00011011: case /*0034 0x1C*/ 0b00011100: case /*0035 0x1D*/ 0b00011101: OpWutNopEv(m); break; case /*0037 0x1F*/ 0b00011111: OpNopEv(m); break; case /*0161 0x71*/ 0b01110001: switch (ModrmReg(m->xedd)) { CASE(2, OpSseUdqIb(m, kOpSseUdqIbPsrlw)); CASE(4, OpSseUdqIb(m, kOpSseUdqIbPsraw)); CASE(6, OpSseUdqIb(m, kOpSseUdqIbPsllw)); default: OpUd(m); } break; case /*0162 0x72*/ 0b01110010: switch (ModrmReg(m->xedd)) { CASE(2, OpSseUdqIb(m, kOpSseUdqIbPsrld)); CASE(4, OpSseUdqIb(m, kOpSseUdqIbPsrad)); CASE(6, OpSseUdqIb(m, kOpSseUdqIbPslld)); default: OpUd(m); } break; case /*0163 0x73*/ 0b01110011: switch (ModrmReg(m->xedd)) { CASE(2, OpSseUdqIb(m, kOpSseUdqIbPsrlq)); CASE(3, OpSseUdqIb(m, kOpSseUdqIbPsrldq)); CASE(6, OpSseUdqIb(m, kOpSseUdqIbPsllq)); CASE(7, OpSseUdqIb(m, kOpSseUdqIbPslldq)); default: OpUd(m); } break; case /*0244 0xA4*/ 0b10100100: case /*0245 0xA5*/ 0b10100101: case /*0254 0xAC*/ 0b10101100: case /*0255 0xAD*/ 0b10101101: OpEvqpGvqp(m, OpDoubleShift, MUTATING); break; case /*0256 0xAE*/ 0b10101110: switch (ModrmReg(m->xedd)) { CASE(5, OpLfence(m)); CASE(6, OpMfence(m)); case 7: if (0xf8 <= m->xedd->op.modrm && m->xedd->op.modrm <= 0xff) { OpSfence(m); } else { OpClflush(m); } break; default: OpUd(m); } break; case 0xB8: if (m->xedd->op.ild_f3) { OpGvqpEvqp(m, AluPopcnt, MUTATING); } else { OpUd(m); } break; default: OpUd(m); } } static void ExecuteInstructionMap2(struct Machine *m) { switch (m->xedd->op.opcode) { CASE(0x00, OpSse(m, kOpSsePshufb)); CASE(0x01, OpSse(m, kOpSsePhaddw)); CASE(0x02, OpSse(m, kOpSsePhaddd)); CASE(0x03, OpSse(m, kOpSsePhaddsw)); CASE(0x04, OpSse(m, kOpSsePmaddubsw)); CASE(0x05, OpSse(m, kOpSsePhsubw)); CASE(0x06, OpSse(m, kOpSsePhsubd)); CASE(0x07, OpSse(m, kOpSsePhsubsw)); CASE(0x08, OpSse(m, kOpSsePsignb)); CASE(0x09, OpSse(m, kOpSsePsignw)); CASE(0x0A, OpSse(m, kOpSsePsignd)); CASE(0x0B, OpSse(m, kOpSsePmulhrsw)); CASE(0x1C, OpSse(m, kOpSsePabsb)); CASE(0x1D, OpSse(m, kOpSsePabsw)); CASE(0x1E, OpSse(m, kOpSsePabsd)); CASE(0x2A, OpMovntdqaVdqMdq(m)); CASE(0x40, OpSse(m, kOpSsePmulld)); default: OpUd(m); } } static void ExecuteInstructionMap3(struct Machine *m) { switch (m->xedd->op.opcode) { CASE(0x0F, OpSsePalignr(m)); default: OpUd(m); } } static void SaveStash(struct Machine *m) { VirtualRecv(m, m->stashaddr, m->stash, m->stashsize); m->stashaddr = 0; } void ExecuteInstruction(struct Machine *m) { m->ip += m->xedd->length; switch (m->xedd->op.map) { CASE(XED_ILD_MAP0, ExecuteInstructionMap0(m)); CASE(XED_ILD_MAP1, ExecuteInstructionMap1(m)); CASE(XED_ILD_MAP2, ExecuteInstructionMap2(m)); CASE(XED_ILD_MAP3, ExecuteInstructionMap3(m)); default: OpUd(m); } if (m->stashaddr) { SaveStash(m); } }