/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│ │vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│ ╞══════════════════════════════════════════════════════════════════════════════╡ │ Copyright 2018 Intel Corporation │ │ Copyright 2020 Justine Alexandra Roberts Tunney │ │ │ │ Licensed under the Apache License, Version 2.0 (the "License"); │ │ you may not use this file except in compliance with the License. │ │ You may obtain a copy of the License at │ │ │ │ http://www.apache.org/licenses/LICENSE-2.0 │ │ │ │ Unless required by applicable law or agreed to in writing, software │ │ distributed under the License is distributed on an "AS IS" BASIS, │ │ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. │ │ See the License for the specific language governing permissions and │ │ limitations under the License. │ ╚─────────────────────────────────────────────────────────────────────────────*/ #include "libc/assert.h" #include "libc/bits/bits.h" #include "libc/dce.h" #include "libc/macros.h" #include "libc/nexgen32e/bsr.h" #include "libc/runtime/runtime.h" #include "libc/str/str.h" #include "third_party/xed/avx.h" #include "third_party/xed/avx512.h" #include "third_party/xed/private.h" #include "third_party/xed/x86.h" asm(".ident\t\"\\n\\n\ Xed (Apache 2.0)\\n\ Copyright 2018 Intel Corporation\\n\ Copyright 2019 Justine Alexandra Roberts Tunney\\n\ Modifications: Trimmed down to 3kb [2019-03-22 jart]\""); asm(".include \"libc/disclaimer.inc\""); #define XED_ILD_HASMODRM_IGNORE_MOD 2 #define XED_I_LF_BRDISP8_BRDISP_WIDTH_CONST_l2 1 #define XED_I_LF_BRDISPz_BRDISP_WIDTH_OSZ_NONTERM_EOSZ_l2 2 #define XED_I_LF_DISP_BUCKET_0_l1 3 #define XED_I_LF_EMPTY_DISP_CONST_l2 4 #define XED_I_LF_MEMDISPv_DISP_WIDTH_ASZ_NONTERM_EASZ_l2 5 #define XED_I_LF_RESOLVE_BYREG_DISP_map0x0_op0xc7_l1 6 #define XED_I_LF_0_IMM_WIDTH_CONST_l2 1 #define XED_I_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xc7_l1 2 #define XED_I_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf6_l1 3 #define XED_I_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf7_l1 4 #define XED_I_LF_SIMM8_IMM_WIDTH_CONST_l2 5 #define XED_I_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_DF64_EOSZ_l2 6 #define XED_I_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2 7 #define XED_I_LF_UIMM16_IMM_WIDTH_CONST_l2 8 #define XED_I_LF_UIMM8_IMM_WIDTH_CONST_l2 9 #define XED_I_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2 10 #define xed_i_ild_hasimm_map0x0_op0xc8_l1 11 #define xed_i_ild_hasimm_map0x0F_op0x78_l1 12 #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_IGNORE66_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_IGNORE66_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_REFINING66_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_REFINING66_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_DF64_FORCE64_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_DF64_FORCE64_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_FORCE64_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_FORCE64_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_REFINING66_CR_WIDTH_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_REFINING66_CR_WIDTH_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_DF64_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_DF64_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_DF64_IMMUNE66_LOOP64_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_DF64_IMMUNE66_LOOP64_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_IMMUNE66_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_IMMUNE66_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_CR_WIDTH_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_CR_WIDTH_EOSZ) #define XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_IMMUNE_REXW_EOSZ_l2(X) \ xed_set_simmz_imm_width_eosz(X, kXed.OSZ_NONTERM_IMMUNE_REXW_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_IGNORE66_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_IGNORE66_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_REFINING66_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_REFINING66_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_DF64_FORCE64_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_DF64_FORCE64_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_FORCE64_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_FORCE64_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_REFINING66_CR_WIDTH_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_REFINING66_CR_WIDTH_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_DF64_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_DF64_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_DF64_IMMUNE66_LOOP64_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_DF64_IMMUNE66_LOOP64_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_IMMUNE66_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_IMMUNE66_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_CR_WIDTH_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_CR_WIDTH_EOSZ) #define XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_IMMUNE_REXW_EOSZ_l2(X) \ xed_set_uimmv_imm_width_eosz(X, kXed.OSZ_NONTERM_IMMUNE_REXW_EOSZ) extern const uint32_t xed_prefix_table_bit[8] hidden; extern const uint8_t xed_imm_bits_2d[2][256] hidden; extern const uint8_t xed_has_modrm_2d[XED_ILD_MAP2][256] hidden; extern const uint8_t xed_has_sib_table[3][4][8] hidden; extern const uint8_t xed_has_disp_regular[3][4][8] hidden; extern const uint8_t xed_disp_bits_2d[XED_ILD_MAP2][256] hidden; static const struct XedDenseMagnums { unsigned vex_prefix_recoding[4]; xed_bits_t eamode[2][3]; xed_bits_t BRDISPz_BRDISP_WIDTH[4]; xed_bits_t MEMDISPv_DISP_WIDTH[4]; xed_bits_t SIMMz_IMM_WIDTH[4]; xed_bits_t UIMMv_IMM_WIDTH[4]; xed_bits_t ASZ_NONTERM_EASZ[2][3]; xed_bits_t OSZ_NONTERM_CR_WIDTH_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_DF64_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_DF64_FORCE64_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_DF64_IMMUNE66_LOOP64_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_FORCE64_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_IGNORE66_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_IMMUNE66_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_IMMUNE_REXW_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_REFINING66_CR_WIDTH_EOSZ[2][2][3]; xed_bits_t OSZ_NONTERM_REFINING66_EOSZ[2][2][3]; } kXed = { .vex_prefix_recoding = {0, 1, 3, 2}, .BRDISPz_BRDISP_WIDTH = {0, 16, 32, 32}, .MEMDISPv_DISP_WIDTH = {0, 16, 32, 64}, .SIMMz_IMM_WIDTH = {0x00, 0x10, 0x20, 0x20}, .UIMMv_IMM_WIDTH = {0x00, 0x10, 0x20, 0x40}, .ASZ_NONTERM_EASZ = { [0][0] = 0x1, [1][0] = 0x2, [0][1] = 0x2, [1][1] = 0x1, [0][2] = 0x3, [1][2] = 0x2, }, .OSZ_NONTERM_CR_WIDTH_EOSZ = { [0][0][0] = 0x2, [1][0][0] = 0x2, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x2, [1][1][1] = 0x2, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x3, [0][0][2] = 0x3, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_DF64_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x1, [1][1][1] = 0x1, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x1, [0][0][2] = 0x3, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_DF64_FORCE64_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x1, [1][1][1] = 0x1, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x3, [0][0][2] = 0x3, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_DF64_IMMUNE66_LOOP64_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x1, [1][1][1] = 0x1, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x3, [0][0][2] = 0x3, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x1, [1][1][1] = 0x1, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x1, [0][0][2] = 0x2, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_FORCE64_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x1, [1][1][1] = 0x1, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x3, [0][0][2] = 0x3, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_IGNORE66_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x1, [1][1][0] = 0x1, [0][1][1] = 0x2, [1][1][1] = 0x2, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x2, [0][0][2] = 0x2, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_IMMUNE66_EOSZ = { [0][0][0] = 0x2, [1][0][0] = 0x2, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x2, [1][1][1] = 0x2, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x2, [0][0][2] = 0x2, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_IMMUNE_REXW_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x1, [1][1][1] = 0x1, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x1, [0][0][2] = 0x2, [1][1][2] = 0x2, [1][0][2] = 0x2, }, .OSZ_NONTERM_REFINING66_CR_WIDTH_EOSZ = { [0][0][0] = 0x2, [1][0][0] = 0x2, [0][1][0] = 0x2, [1][1][0] = 0x2, [0][1][1] = 0x2, [1][1][1] = 0x2, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x3, [0][0][2] = 0x3, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .OSZ_NONTERM_REFINING66_EOSZ = { [0][0][0] = 0x1, [1][0][0] = 0x1, [0][1][0] = 0x1, [1][1][0] = 0x1, [0][1][1] = 0x2, [1][1][1] = 0x2, [0][0][1] = 0x2, [1][0][1] = 0x2, [0][1][2] = 0x2, [0][0][2] = 0x2, [1][1][2] = 0x3, [1][0][2] = 0x3, }, .eamode = { [0][XED_MODE_REAL] = XED_MODE_REAL, [0][XED_MODE_LEGACY] = XED_MODE_LEGACY, [0][XED_MODE_LONG] = XED_MODE_LONG, [1][XED_MODE_REAL] = XED_MODE_LEGACY, [1][XED_MODE_LEGACY] = XED_MODE_REAL, [1][XED_MODE_LONG] = XED_MODE_LEGACY, }, }; privileged static void xed_too_short(struct XedDecodedInst *d) { d->op.out_of_bytes = 1; if (d->op.max_bytes >= 15) { d->op.error = XED_ERROR_INSTR_TOO_LONG; } else { d->op.error = XED_ERROR_BUFFER_TOO_SHORT; } } privileged static void xed_bad_map(struct XedDecodedInst *d) { d->op.map = XED_ILD_MAP_INVALID; d->op.error = XED_ERROR_BAD_MAP; } privileged static void xed_bad_v4(struct XedDecodedInst *d) { d->op.error = XED_ERROR_BAD_EVEX_V_PRIME; } privileged static void xed_bad_z_aaa(struct XedDecodedInst *d) { d->op.error = XED_ERROR_BAD_EVEX_Z_NO_MASKING; } privileged static xed_bits_t xed_get_prefix_table_bit(xed_bits_t a) { return (xed_prefix_table_bit[a >> 5] >> (a & 0x1F)) & 1; } privileged static size_t xed_bits2bytes(unsigned bits) { return bits >> 3; } privileged static size_t xed_bytes2bits(unsigned bytes) { return bytes << 3; } privileged static bool xed3_mode_64b(struct XedDecodedInst *d) { return d->op.mode == XED_MODE_LONG; } privileged static void xed_set_hint(char b, struct XedDecodedInst *d) { switch (b) { case 0x2e: d->op.hint = XED_HINT_NTAKEN; return; case 0x3e: d->op.hint = XED_HINT_TAKEN; return; default: break; } } privileged static void XED_LF_SIMM8_IMM_WIDTH_CONST_l2( struct XedDecodedInst *x) { x->op.imm_width = 8; x->op.imm_signed = true; } privileged static void XED_LF_UIMM16_IMM_WIDTH_CONST_l2( struct XedDecodedInst *x) { x->op.imm_width = 16; } privileged static void XED_LF_SE_IMM8_IMM_WIDTH_CONST_l2( struct XedDecodedInst *x) { x->op.imm_width = 8; } privileged static void XED_LF_UIMM32_IMM_WIDTH_CONST_l2( struct XedDecodedInst *x) { x->op.imm_width = 32; } privileged static void xed_set_simmz_imm_width_eosz( struct XedDecodedInst *x, const xed_bits_t eosz[2][2][3]) { x->op.imm_width = kXed.SIMMz_IMM_WIDTH[eosz[x->op.rexw][x->op.osz][x->op.mode]]; x->op.imm_signed = true; } privileged static void xed_set_uimmv_imm_width_eosz( struct XedDecodedInst *x, const xed_bits_t eosz[2][2][3]) { x->op.imm_width = kXed.UIMMv_IMM_WIDTH[eosz[x->op.rexw][x->op.osz][x->op.mode]]; } privileged static void XED_LF_UIMM8_IMM_WIDTH_CONST_l2( struct XedDecodedInst *x) { x->op.imm_width = 8; } privileged static void XED_LF_0_IMM_WIDTH_CONST_l2(struct XedDecodedInst *x) { x->op.imm_width = 0; } privileged static void XED_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xc7_l1( struct XedDecodedInst *x) { switch (x->op.reg) { case 0: XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2(x); break; case 7: XED_LF_0_IMM_WIDTH_CONST_l2(x); break; default: break; } } privileged static void XED_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf6_l1( struct XedDecodedInst *x) { if (x->op.reg <= 1) { XED_LF_SIMM8_IMM_WIDTH_CONST_l2(x); } else if (2 <= x->op.reg && x->op.reg <= 7) { XED_LF_0_IMM_WIDTH_CONST_l2(x); } } privileged static void XED_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf7_l1( struct XedDecodedInst *x) { if (x->op.reg <= 1) { XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2(x); } else if (2 <= x->op.reg && x->op.reg <= 7) { XED_LF_0_IMM_WIDTH_CONST_l2(x); } } privileged static void xed_ild_hasimm_map0x0F_op0x78_l1( struct XedDecodedInst *x) { if (x->op.osz || x->op.ild_f2) { x->op.imm_width = xed_bytes2bits(1); x->op.imm1_bytes = 1; } } privileged static void xed_ild_hasimm_map0x0_op0xc8_l1( struct XedDecodedInst *x) { x->op.imm_width = xed_bytes2bits(2); x->op.imm1_bytes = 1; } privileged static void xed_set_imm_bytes(struct XedDecodedInst *d) { if (!d->op.imm_width && d->op.map < XED_ILD_MAP2) { switch (xed_imm_bits_2d[d->op.map][d->op.opcode]) { case XED_I_LF_0_IMM_WIDTH_CONST_l2: XED_LF_0_IMM_WIDTH_CONST_l2(d); break; case XED_I_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xc7_l1: XED_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xc7_l1(d); break; case XED_I_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf6_l1: XED_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf6_l1(d); break; case XED_I_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf7_l1: XED_LF_RESOLVE_BYREG_IMM_WIDTH_map0x0_op0xf7_l1(d); break; case XED_I_LF_SIMM8_IMM_WIDTH_CONST_l2: XED_LF_SIMM8_IMM_WIDTH_CONST_l2(d); break; case XED_I_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_DF64_EOSZ_l2: XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_DF64_EOSZ_l2(d); break; case XED_I_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2: XED_LF_SIMMz_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2(d); break; case XED_I_LF_UIMM16_IMM_WIDTH_CONST_l2: XED_LF_UIMM16_IMM_WIDTH_CONST_l2(d); break; case XED_I_LF_UIMM8_IMM_WIDTH_CONST_l2: XED_LF_UIMM8_IMM_WIDTH_CONST_l2(d); break; case XED_I_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2: XED_LF_UIMMv_IMM_WIDTH_OSZ_NONTERM_EOSZ_l2(d); break; case xed_i_ild_hasimm_map0x0_op0xc8_l1: xed_ild_hasimm_map0x0_op0xc8_l1(d); break; case xed_i_ild_hasimm_map0x0F_op0x78_l1: xed_ild_hasimm_map0x0F_op0x78_l1(d); break; default: d->op.error = XED_ERROR_GENERAL_ERROR; return; } } } privileged static int xed_consume_byte(struct XedDecodedInst *d) { if (d->length < d->op.max_bytes) { return d->bytes[d->length++]; } else { xed_too_short(d); return -1; } } privileged static void xed_prefix_scanner(struct XedDecodedInst *d) { xed_bits_t first_f2f3, last_f2f3, seg; xed_bits_t b, max_bytes, length, nprefixes, nseg_prefixes, nrexes, rex; seg = 0; length = d->length; max_bytes = d->op.max_bytes; first_f2f3 = last_f2f3 = rex = nrexes = nprefixes = nseg_prefixes = 0; while (length < max_bytes) { b = d->bytes[length]; if (xed_get_prefix_table_bit(b) == 0) goto out; switch (b) { case 0x66: d->op.osz = true; rex = 0; break; case 0x67: d->op.asz = true; rex = 0; break; case 0x2E: case 0x3E: xed_set_hint(b, d); /* fallthrough */ case 0x26: case 0x36: if (!xed3_mode_64b(d)) seg = b; nseg_prefixes++; rex = 0; break; case 0x64: case 0x65: seg = b; nseg_prefixes++; rex = 0; break; case 0xF0: d->op.lock = true; rex = 0; break; case 0xF3: d->op.ild_f3 = true; last_f2f3 = 3; if (!first_f2f3) { first_f2f3 = 3; } rex = 0; break; case 0xF2: d->op.ild_f2 = true; last_f2f3 = 2; if (!first_f2f3) { first_f2f3 = 2; } rex = 0; break; default: if (xed3_mode_64b(d) && (b & 0xf0) == 0x40) { nrexes++; rex = b; break; } else { goto out; } } length++; nprefixes++; } out: d->length = length; d->op.nprefixes = nprefixes; d->op.nseg_prefixes = nseg_prefixes; d->op.nrexes = nrexes; if (rex) { d->op.rexw = rex >> 3 & 1; d->op.rexr = rex >> 2 & 1; d->op.rexx = rex >> 1 & 1; d->op.rexb = rex & 1; d->op.rex = true; } if (d->op.mode_first_prefix) { d->op.rep = first_f2f3; } else { d->op.rep = last_f2f3; } switch (seg) { case 0x26: /* ES */ d->op.seg_ovd = 0 + 1; break; case 0x2e: /* CS */ d->op.seg_ovd = 1 + 1; break; case 0x36: /* SS */ d->op.seg_ovd = 2 + 1; break; case 0x3e: /* DS */ d->op.seg_ovd = 3 + 1; break; case 0x64: /* FS */ d->op.seg_ovd = 4 + 1; break; case 0x65: /* GS */ d->op.seg_ovd = 5 + 1; break; default: break; } if (length >= max_bytes) { xed_too_short(d); return; } } privileged static void xed_get_next_as_opcode(struct XedDecodedInst *d) { xed_bits_t b, length; length = d->length; if (length < d->op.max_bytes) { b = d->bytes[length]; d->op.opcode = b; d->length++; /* d->op.srm = xed_modrm_rm(b); */ } else { xed_too_short(d); } } privileged static void xed_catch_invalid_rex_or_legacy_prefixes( struct XedDecodedInst *d) { if (xed3_mode_64b(d) && d->op.rex) { d->op.error = XED_ERROR_BAD_REX_PREFIX; } else if (d->op.osz || d->op.ild_f3 || d->op.ild_f2) { d->op.error = XED_ERROR_BAD_LEGACY_PREFIX; } } privileged static void xed_catch_invalid_mode(struct XedDecodedInst *d) { if (d->op.realmode) { d->op.error = XED_ERROR_INVALID_MODE; } } privileged static void xed_evex_vex_opcode_scanner(struct XedDecodedInst *d) { d->op.opcode = d->bytes[d->length]; d->op.pos_opcode = d->length++; xed_catch_invalid_rex_or_legacy_prefixes(d); xed_catch_invalid_mode(d); } privileged static void xed_opcode_scanner(struct XedDecodedInst *d) { xed_bits_t b, length; length = d->length; if ((b = d->bytes[length]) != 0x0F) { d->op.map = XED_ILD_MAP0; d->op.opcode = b; d->op.pos_opcode = length; d->length++; } else { length++; d->op.pos_opcode = length; if (length < d->op.max_bytes) { switch ((b = d->bytes[length])) { case 0x38: length++; d->op.map = XED_ILD_MAP2; d->length = length; xed_get_next_as_opcode(d); return; case 0x3A: length++; d->op.map = XED_ILD_MAP3; d->length = length; d->op.imm_width = xed_bytes2bits(1); xed_get_next_as_opcode(d); return; case 0x3B: length++; xed_bad_map(d); d->length = length; xed_get_next_as_opcode(d); return; case 0x39: case 0x3C: case 0x3D: case 0x3E: case 0x3F: length++; xed_bad_map(d); d->length = length; xed_get_next_as_opcode(d); return; case 0x0F: d->op.amd3dnow = true; length++; d->op.opcode = 0x0F; d->op.map = XED_ILD_MAPAMD; d->length = length; break; default: length++; d->op.opcode = b; d->op.map = XED_ILD_MAP1; d->length = length; break; } } else { xed_too_short(d); return; } } /* d->op.srm = xed_modrm_rm(d->op.opcode); */ } privileged static bool xed_is_bound_instruction(struct XedDecodedInst *d) { return !xed3_mode_64b(d) && d->length + 1 < d->op.max_bytes && (d->bytes[d->length + 1] & 0xC0) != 0xC0; } privileged static void xed_evex_scanner(struct XedDecodedInst *d) { xed_bits_t length, max_bytes; union XedAvx512Payload1 evex1; union XedAvx512Payload2 evex2; union XedAvx512Payload3 evex3; length = d->length; max_bytes = d->op.max_bytes; /* @assume prefix_scanner() checked length */ if (d->bytes[length] != 0x62) return; if (xed_is_bound_instruction(d)) return; if (length + 4 < max_bytes) { evex1.u32 = d->bytes[length + 1]; evex2.u32 = d->bytes[length + 2]; if (xed3_mode_64b(d)) { d->op.rexr = ~evex1.s.r_inv & 1; d->op.rexx = ~evex1.s.x_inv & 1; d->op.rexb = ~evex1.s.b_inv & 1; d->op.rexrr = ~evex1.s.rr_inv & 1; } d->op.rexw = evex2.s.rexw & 1; d->op.map = evex1.s.map; d->op.vexdest3 = evex2.s.vexdest3; d->op.vexdest210 = evex2.s.vexdest210; d->op.ubit = evex2.s.ubit; if (evex2.s.ubit) { d->op.vexvalid = 2; } else { d->op.error = XED_ERROR_BAD_EVEX_UBIT; } d->op.vex_prefix = kXed.vex_prefix_recoding[evex2.s.pp]; if (evex1.s.map == XED_ILD_MAP3) { d->op.imm_width = xed_bytes2bits(1); } if (evex2.s.ubit) { evex3.u32 = d->bytes[length + 3]; d->op.zeroing = evex3.s.z; d->op.llrc = evex3.s.llrc; d->op.vl = evex3.s.llrc; d->op.bcrc = evex3.s.bcrc; d->op.vexdest4 = ~evex3.s.vexdest4p & 1; if (!xed3_mode_64b(d) && evex3.s.vexdest4p == 0) { xed_bad_v4(d); } d->op.mask = evex3.s.mask; if (evex3.s.mask == 0 && evex3.s.z == 1) { xed_bad_z_aaa(d); } } length += 4; d->length = length; xed_evex_vex_opcode_scanner(d); } else { xed_too_short(d); } } privileged static uint64_t xed_read_number(uint8_t *p, size_t n, bool s) { switch (s << 2 | bsr(n)) { case 0b000: return *p; case 0b100: return (int8_t)*p; case 0b001: return READ16LE(p); case 0b101: return (int16_t)READ16LE(p); case 0b010: return READ32LE(p); case 0b110: return (int32_t)READ32LE(p); case 0b011: case 0b111: return READ64LE(p); default: unreachable; } } privileged static void xed_evex_imm_scanner(struct XedDecodedInst *d) { uint64_t uimm0; uint8_t *itext, *imm_ptr; xed_bits_t length, imm_bytes, imm1_bytes, max_bytes; imm_ptr = 0; itext = d->bytes; xed_set_imm_bytes(d); length = d->length; max_bytes = d->op.max_bytes; if (d->op.amd3dnow) { if (length < max_bytes) { d->op.opcode = d->bytes[length]; d->length++; return; } else { xed_too_short(d); return; } } imm_bytes = xed_bits2bytes(d->op.imm_width); imm1_bytes = d->op.imm1_bytes; if (imm_bytes) { if (length + imm_bytes <= max_bytes) { d->op.pos_imm = length; length += imm_bytes; d->length = length; if (imm1_bytes) { if (length + imm1_bytes <= max_bytes) { d->op.pos_imm1 = length; imm_ptr = itext + length; length += imm1_bytes; d->length = length; d->op.uimm1 = *imm_ptr; } else { xed_too_short(d); return; } } } else { xed_too_short(d); return; } } if (imm_bytes) { d->op.uimm0 = xed_read_number(itext + d->op.pos_imm, imm_bytes, d->op.imm_signed); } } privileged static void xed_vex_c4_scanner(struct XedDecodedInst *d) { uint8_t n; xed_bits_t length, max_bytes; union XedAvxC4Payload1 c4byte1; union XedAvxC4Payload2 c4byte2; if (xed_is_bound_instruction(d)) return; length = d->length; max_bytes = d->op.max_bytes; length++; if (length + 2 < max_bytes) { c4byte1.u32 = d->bytes[length]; c4byte2.u32 = d->bytes[length + 1]; d->op.rexr = ~c4byte1.s.r_inv & 1; d->op.rexx = ~c4byte1.s.x_inv & 1; d->op.rexb = (xed3_mode_64b(d) & ~c4byte1.s.b_inv) & 1; d->op.rexw = c4byte2.s.w & 1; d->op.vexdest3 = c4byte2.s.v3; d->op.vexdest210 = c4byte2.s.vvv210; d->op.vl = c4byte2.s.l; d->op.vex_prefix = kXed.vex_prefix_recoding[c4byte2.s.pp]; d->op.map = c4byte1.s.map; if ((c4byte1.s.map & 0x3) == XED_ILD_MAP3) { d->op.imm_width = xed_bytes2bits(1); } d->op.vexvalid = 1; length += 2; d->length = length; xed_evex_vex_opcode_scanner(d); } else { d->length = length; xed_too_short(d); } } privileged static void xed_vex_c5_scanner(struct XedDecodedInst *d) { xed_bits_t max_bytes, length; union XedAvxC5Payload c5byte1; length = d->length; max_bytes = d->op.max_bytes; if (xed_is_bound_instruction(d)) return; length++; if (length + 1 < max_bytes) { c5byte1.u32 = d->bytes[length]; d->op.rexr = ~c5byte1.s.r_inv & 1; d->op.vexdest3 = c5byte1.s.v3; d->op.vexdest210 = c5byte1.s.vvv210; d->op.vl = c5byte1.s.l; d->op.vex_prefix = kXed.vex_prefix_recoding[c5byte1.s.pp]; d->op.map = XED_ILD_MAP1; d->op.vexvalid = 1; length++; d->length = length; xed_evex_vex_opcode_scanner(d); } else { d->length = length; xed_too_short(d); } } privileged static void xed_vex_scanner(struct XedDecodedInst *d) { if (!d->op.out_of_bytes) { switch (d->bytes[d->length]) { case 0xC5: xed_vex_c5_scanner(d); break; case 0xC4: xed_vex_c4_scanner(d); break; default: break; } } } privileged static void xed_bad_ll(struct XedDecodedInst *d) { d->op.error = XED_ERROR_BAD_EVEX_LL; } privileged static void xed_bad_ll_check(struct XedDecodedInst *d) { if (d->op.llrc == 3) { if (d->op.mod != 3) { xed_bad_ll(d); } else if (d->op.bcrc == 0) { xed_bad_ll(d); } } } privileged static void xed_set_has_modrm(struct XedDecodedInst *d) { if (d->op.map < ARRAYLEN(xed_has_modrm_2d)) { d->op.has_modrm = xed_has_modrm_2d[d->op.map][d->op.opcode]; } else { d->op.has_modrm = 1; } } privileged static void xed_modrm_scanner(struct XedDecodedInst *d) { uint8_t b; xed_bits_t eamode, mod, rm, asz, mode, length, has_modrm; xed_set_has_modrm(d); has_modrm = d->op.has_modrm; if (has_modrm) { length = d->length; if (length < d->op.max_bytes) { b = d->bytes[length]; d->op.modrm = b; d->op.pos_modrm = length; d->length++; mod = xed_modrm_mod(b); rm = xed_modrm_rm(b); d->op.mod = mod; d->op.rm = rm; d->op.reg = xed_modrm_reg(b); xed_bad_ll_check(d); if (has_modrm != XED_ILD_HASMODRM_IGNORE_MOD) { asz = d->op.asz; mode = d->op.mode; eamode = kXed.eamode[asz][mode]; d->op.disp_width = xed_bytes2bits(xed_has_disp_regular[eamode][mod][rm]); d->op.has_sib = xed_has_sib_table[eamode][mod][rm]; } } else { xed_too_short(d); } } } privileged static void xed_sib_scanner(struct XedDecodedInst *d) { uint8_t b; xed_bits_t length; if (d->op.has_sib) { length = d->length; if (length < d->op.max_bytes) { b = d->bytes[length]; d->op.pos_sib = length; d->op.sib = b; d->length++; if (xed_sib_base(b) == 5) { if (d->op.mod == 0) { d->op.disp_width = xed_bytes2bits(4); } } } else { xed_too_short(d); } } } privileged static void XED_LF_EMPTY_DISP_CONST_l2(struct XedDecodedInst *x) { /* This function does nothing for map-opcodes whose * disp_bytes value is set earlier in xed-ild.c * (regular displacement resolution by modrm/sib)*/ (void)x; } privileged static void XED_LF_BRDISP8_BRDISP_WIDTH_CONST_l2( struct XedDecodedInst *x) { x->op.disp_width = 0x8; } privileged static void XED_LF_BRDISPz_BRDISP_WIDTH_OSZ_NONTERM_EOSZ_l2( struct XedDecodedInst *x) { x->op.disp_width = kXed.BRDISPz_BRDISP_WIDTH[kXed.OSZ_NONTERM_EOSZ[x->op.rexw][x->op.osz] [x->op.mode]]; x->op.disp_unsigned = true; } privileged static void XED_LF_RESOLVE_BYREG_DISP_map0x0_op0xc7_l1( struct XedDecodedInst *x) { switch (x->op.reg) { case 0: XED_LF_EMPTY_DISP_CONST_l2(x); break; case 7: XED_LF_BRDISPz_BRDISP_WIDTH_OSZ_NONTERM_EOSZ_l2(x); break; default: break; } } privileged static void XED_LF_MEMDISPv_DISP_WIDTH_ASZ_NONTERM_EASZ_l2( struct XedDecodedInst *x) { x->op.disp_width = kXed.MEMDISPv_DISP_WIDTH[kXed.ASZ_NONTERM_EASZ[x->op.asz][x->op.mode]]; x->op.disp_unsigned = true; } privileged static void XED_LF_BRDISP32_BRDISP_WIDTH_CONST_l2( struct XedDecodedInst *x) { x->op.disp_width = 0x20; } privileged static void XED_LF_DISP_BUCKET_0_l1(struct XedDecodedInst *x) { if (x->op.mode <= XED_MODE_LEGACY) { XED_LF_BRDISPz_BRDISP_WIDTH_OSZ_NONTERM_EOSZ_l2(x); x->op.disp_unsigned = false; } else if (x->op.mode == XED_MODE_LONG) { XED_LF_BRDISP32_BRDISP_WIDTH_CONST_l2(x); } } privileged static void xed_disp_scanner(struct XedDecodedInst *d) { xed_bits_t length, disp_width, disp_bytes, max_bytes; length = d->length; if (d->op.map < XED_ILD_MAP2) { switch (xed_disp_bits_2d[d->op.map][d->op.opcode]) { case XED_I_LF_BRDISP8_BRDISP_WIDTH_CONST_l2: XED_LF_BRDISP8_BRDISP_WIDTH_CONST_l2(d); break; case XED_I_LF_BRDISPz_BRDISP_WIDTH_OSZ_NONTERM_EOSZ_l2: XED_LF_BRDISPz_BRDISP_WIDTH_OSZ_NONTERM_EOSZ_l2(d); break; case XED_I_LF_DISP_BUCKET_0_l1: XED_LF_DISP_BUCKET_0_l1(d); break; case XED_I_LF_EMPTY_DISP_CONST_l2: XED_LF_EMPTY_DISP_CONST_l2(d); break; case XED_I_LF_MEMDISPv_DISP_WIDTH_ASZ_NONTERM_EASZ_l2: XED_LF_MEMDISPv_DISP_WIDTH_ASZ_NONTERM_EASZ_l2(d); break; case XED_I_LF_RESOLVE_BYREG_DISP_map0x0_op0xc7_l1: XED_LF_RESOLVE_BYREG_DISP_map0x0_op0xc7_l1(d); break; default: d->op.error = XED_ERROR_GENERAL_ERROR; return; } } disp_bytes = xed_bits2bytes(d->op.disp_width); if (disp_bytes) { max_bytes = d->op.max_bytes; if (length + disp_bytes <= max_bytes) { d->op.disp = xed_read_number(d->bytes + length, disp_bytes, !d->op.disp_unsigned); d->op.pos_disp = length; d->length = length + disp_bytes; } else { xed_too_short(d); } } } privileged static void xed_decode_instruction_length( struct XedDecodedInst *ild) { xed_prefix_scanner(ild); if (!ild->op.out_of_bytes) { xed_vex_scanner(ild); if (!ild->op.out_of_bytes) { if (!ild->op.vexvalid) xed_evex_scanner(ild); if (!ild->op.out_of_bytes) { if (!ild->op.vexvalid && !ild->op.error) { xed_opcode_scanner(ild); } xed_modrm_scanner(ild); xed_sib_scanner(ild); xed_disp_scanner(ild); xed_evex_imm_scanner(ild); } } } } privileged static void xed_encode_rde(struct XedDecodedInst *x) { const uint8_t kWordLog2[2][2][2] = {{{2, 3}, {1, 3}}, {{0, 0}, {0, 0}}}; uint32_t osz = x->op.osz ^ x->op.realmode; x->op.rde = kWordLog2[~x->op.opcode & 1][osz][x->op.rexw] << 28 | x->op.mode << 26 | kXed.eamode[x->op.asz][x->op.mode] << 24 | x->op.rep << 30 | x->op.mod << 22 | x->op.asz << 17 | x->op.seg_ovd << 18 | x->op.rexw << 6 | osz << 5 | (x->op.rex << 4 | x->op.rexb << 3 | x->op.srm) << 12 | (x->op.rex << 4 | x->op.rexb << 3 | x->op.rm) << 7 | (x->op.rex << 4 | x->op.rexr << 3 | x->op.reg); } /** * Clears instruction decoder state. */ privileged struct XedDecodedInst *xed_decoded_inst_zero_set_mode( struct XedDecodedInst *p, enum XedMachineMode mmode) { __builtin_memset(p, 0, sizeof(*p)); xed_operands_set_mode(&p->op, mmode); return p; } /** * Decodes machine instruction length. * * This function also decodes other useful attributes, such as the * offsets of displacement, immediates, etc. It works for all ISAs from * 1977 to 2020. * * @note binary footprint increases ~4kb if this is used * @see biggest code in gdb/clang/tensorflow binaries */ privileged enum XedError xed_instruction_length_decode( struct XedDecodedInst *xedd, const void *itext, size_t bytes) { __builtin_memcpy(xedd->bytes, itext, MIN(15, bytes)); xedd->op.max_bytes = MIN(15, bytes); xed_decode_instruction_length(xedd); xed_encode_rde(xedd); if (!xedd->op.out_of_bytes) { if (xedd->op.map != XED_ILD_MAP_INVALID) { return xedd->op.error; } else { return XED_ERROR_GENERAL_ERROR; } } else { return XED_ERROR_BUFFER_TOO_SHORT; } }