#ifndef _BX_DISASM_H_ #define _BX_DISASM_H_ #include "config.h" #define BX_DECODE_MODRM(modrm_byte, mod, opcode, rm) { \ mod = (modrm_byte >> 6) & 0x03; \ opcode = (modrm_byte >> 3) & 0x07; \ rm = modrm_byte & 0x07; \ } #define BX_DECODE_SIB(sib_byte, scale, index, base) { \ scale = sib >> 6; \ index = (sib >> 3) & 0x07; \ base = sib & 0x07; \ } // will be used in future #define IA_8086 0x00000000 /* 8086 instruction */ #define IA_286 0x00000000 /* 286+ instruction */ #define IA_386 0x00000000 /* 386+ instruction */ #define IA_FPU 0x00000000 #define IA_486 0x00000000 /* 486+ instruction */ #define IA_PENTIUM 0x00000000 /* Pentium instruction */ #define IA_P6 0x00000000 /* P6 instruction */ #define IA_KATMAI 0x00000000 /* Katmai instruction */ #define IA_WILLAMETTE 0x00000000 /* Willamette instruction */ #define IA_PRESCOTT 0x00000000 /* Prescott instruction */ #define IA_X86_64 0x00000000 /* x86-64 specific instruction */ #define IF_ARITHMETIC 0x00000000 /* arithmetic instruction */ #define IF_LOGIC 0x00000000 /* logic instruction */ #define IF_SYSTEM 0x00000000 /* system instruction (require CPL=0) */ #define IF_BRANCH 0x00000000 /* branch instruction */ #define IF_FPU 0x00000000 /* FPU instruction */ #define IF_MMX 0x00000000 /* MMX instruction */ #define IF_3DNOW 0x00000000 /* 3DNow! instruction */ #define IF_KNI 0x00000000 /* Katmai new instruction */ #define IF_PREFETCH 0x00000000 /* Prefetch instruction */ #define IF_SSE 0x00000000 /* SSE instruction */ #define IF_SSE2 0x00000000 /* SSE2 instruction */ #define IF_PNI 0x00000000 /* Prescott new instruction */ enum { AL_REG, CL_REG, DL_REG, BL_REG, AH_REG, CH_REG, DH_REG, BH_REG }; enum { AX_REG, CX_REG, DX_REG, BX_REG, SP_REG, BP_REG, SI_REG, DI_REG }; enum { eAX_REG, eCX_REG, eDX_REG, eBX_REG, eSP_REG, eBP_REG, eSI_REG, eDI_REG }; #if BX_DISASM_SUPPORT_X86_64 enum { rAX_REG, rCX_REG, rDX_REG, rBX_REG, rSP_REG, rBP_REG, rSI_REG, rDI_REG }; #endif enum { ES_REG, CS_REG, SS_REG, DS_REG, FS_REG, GS_REG }; class disassembler; typedef void (disassembler::*BxDisasmPtr_t) (unsigned attr); typedef void (disassembler::*BxDisasmResolveModrmPtr_t) (unsigned attr); struct BxDisasmOpcodeInfo_t { const char *Opcode; unsigned Attr; BxDisasmPtr_t Operand1; unsigned Op1Attr; BxDisasmPtr_t Operand2; unsigned Op2Attr; BxDisasmPtr_t Operand3; unsigned Op3Attr; struct BxDisasmOpcodeInfo_t *AnotherArray; }; // datasize attributes #define X_SIZE 0x0000 #define B_SIZE 0x0100 #define W_SIZE 0x0200 #define D_SIZE 0x0300 #define V_SIZE 0x0400 #define Q_SIZE 0x0500 #define Z_SIZE 0x0600 #define O_SIZE 0x0700 #define T_SIZE 0x0800 #define P_SIZE 0x0900 #define S_SIZE 0x0A00 // branch hint attribute #define BRANCH_HINT 0x1000 class disassembler { public: disassembler() { set_syntax_intel(); } unsigned disasm(bx_bool is_32, bx_address base, bx_address ip, Bit8u *instr, char *disbuf); void set_syntax_intel(); void set_syntax_att (); private: bx_bool intel_mode; const char **general_16bit_regname; const char **general_8bit_regname; const char **general_32bit_regname; #if BX_DISASM_SUPPORT_X86_64 const char **general_8bit_regname_rex; const char **general_64bit_regname; #endif const char **segment_name; const char **index16; const char *sreg_mod01or10_rm32[8]; const char *sreg_mod00_base32[8]; const char *sreg_mod01or10_base32[8]; const char *sreg_mod00_rm16[8]; const char *sreg_mod01or10_rm16[8]; private: bx_bool os_32; bx_bool as_32; #if BX_DISASM_SUPPORT_X86_64 bx_bool os_64; bx_bool as_64; #endif Bit8u modrm, mod, nnn, rm; Bit8u sib, scale, sib_index, sib_base; union { Bit16u displ16; Bit32u displ32; } displacement; bx_address db_eip, db_base; unsigned n_prefixes; Bit8u *instruction; // for fetching of next byte of instruction const char *seg_override; char *disbufptr; BxDisasmResolveModrmPtr_t resolve_modrm; BX_CPP_INLINE Bit8u fetch_byte() { db_eip++; return(*instruction++); }; BX_CPP_INLINE Bit8u peek_byte() { return(*instruction); }; BX_CPP_INLINE Bit16u fetch_word() { Bit8u b0 = * (Bit8u *) instruction++; Bit8u b1 = * (Bit8u *) instruction++; Bit16u ret16 = (b1<<8) | b0; db_eip += 2; return(ret16); }; BX_CPP_INLINE Bit32u fetch_dword() { Bit8u b0 = * (Bit8u *) instruction++; Bit8u b1 = * (Bit8u *) instruction++; Bit8u b2 = * (Bit8u *) instruction++; Bit8u b3 = * (Bit8u *) instruction++; Bit32u ret32 = (b3<<24) | (b2<<16) | (b1<<8) | b0; db_eip += 4; return(ret32); }; #if BX_DISASM_SUPPORT_X86_64 BX_CPP_INLINE Bit64u fetch_qword() { Bit64u d0 = fetch_dword(); Bit64u d1 = fetch_dword(); Bit64u ret64 = (d1<<32) | d0; return(ret64); }; #endif void dis_putc(char symbol); void dis_sprintf(char *fmt, ...); void decode_modrm(); void resolve16_mod0 (unsigned mode); void resolve16_mod1or2 (unsigned mode); void resolve32_mod0 (unsigned mode); void resolve32_mod1or2 (unsigned mode); void resolve32_mod0_rm4 (unsigned mode); void resolve32_mod1or2_rm4 (unsigned mode); void initialize_modrm_segregs(); void print_datasize (unsigned mode); void print_memory_access16(int datasize, const char *seg, const char *index, Bit16u disp); void print_memory_access32(int datasize, const char *seg, const char *base, const char *index, int scale, Bit32u disp); void print_disassembly_intel(const BxDisasmOpcodeInfo_t *entry); void print_disassembly_att (const BxDisasmOpcodeInfo_t *entry); public: /* * Codes for Addressing Method: * --------------------------- * A - Direct address. The instruction has no ModR/M byte; the address * of the operand is encoded in the instruction; and no base register, * index register, or scaling factor can be applied. * C - The reg field of the ModR/M byte selects a control register. * D - The reg field of the ModR/M byte selects a debug register. * E - A ModR/M byte follows the opcode and specifies the operand. The * operand is either a general-purpose register or a memory address. * If it is a memory address, the address is computed from a segment * register and any of the following values: a base register, an * index register, a scaling factor, a displacement. * F - Flags Register. * G - The reg field of the ModR/M byte selects a general register. * I - Immediate data. The operand value is encoded in subsequent bytes of * the instruction. * J - The instruction contains a relative offset to be added to the * instruction pointer register. * M - The ModR/M byte may refer only to memory. * O - The instruction has no ModR/M byte; the offset of the operand is * coded as a word or double word (depending on address size attribute) * in the instruction. No base register, index register, or scaling * factor can be applied. * P - The reg field of the ModR/M byte selects a packed quadword MMX * technology register. * Q - A ModR/M byte follows the opcode and specifies the operand. The * operand is either an MMX technology register or a memory address. * If it is a memory address, the address is computed from a segment * register and any of the following values: a base register, an * index register, a scaling factor, and a displacement. * R - The mod field of the ModR/M byte may refer only to a general register. * S - The reg field of the ModR/M byte selects a segment register. * T - The reg field of the ModR/M byte selects a test register. * V - The reg field of the ModR/M byte selects a 128-bit XMM register. * W - A ModR/M byte follows the opcode and specifies the operand. The * operand is either a 128-bit XMM register or a memory address. If * it is a memory address, the address is computed from a segment * register and any of the following values: a base register, an * index register, a scaling factor, and a displacement. * X - Memory addressed by the DS:rSI register pair. * Y - Memory addressed by the ES:rDI register pair. */ /* * Codes for Operand Type: * ---------------------- * a - Two one-word operands in memory or two double-word operands in * memory, depending on operand-size attribute (used only by the BOUND * instruction). * b - Byte, regardless of operand-size attribute. * d - Doubleword, regardless of operand-size attribute. * dq - Double-quadword, regardless of operand-size attribute. * p - 32-bit or 48-bit pointer, depending on operand-size attribute. * pd - 128-bit packed double-precision floating-point data. * pi - Quadword MMX technology register (packed integer) * ps - 128-bit packed single-precision floating-point data. * q - Quadword, regardless of operand-size attribute. * s - 6-byte or 10-byte pseudo-descriptor. * si - Doubleword integer register (scalar integer) * ss - Scalar element of a 128-bit packed single-precision floating data. * sd - Scalar element of a 128-bit packed double-precision floating data. * v - Word, doubleword or quadword, depending on operand-size attribute. * w - Word, regardless of operand-size attribute. * z - A word if the effective operand size is 16 bits, or a doubleword * if the effective operand size is 32 or 64 bits. */ // fpu void ST0 (unsigned attribute); void STj (unsigned attribute); // general/segment register void Rw (unsigned attribute); void Rd (unsigned attribute); void Sw (unsigned attribute); // control/debug register void Cd (unsigned attribute); void Dd (unsigned attribute); void Td (unsigned attribute); // segment register void OP_SEG (unsigned attribute); // memory only void OP_MEM (unsigned attribute); // general purpose register void REG16 (unsigned attribute); void REG8 (unsigned attribute); void REG32 (unsigned attribute); // string instructions void OP_X (unsigned attribute); void OP_Y (unsigned attribute); // mmx/xmm void OP_P (unsigned attribute); void OP_Q (unsigned attribute); void OP_W (unsigned attribute); void OP_V (unsigned attribute); // mov void OP_O (unsigned attribute); // immediate void sIb (unsigned attribute); void I1 (unsigned attribute); void Ib (unsigned attribute); void Iw (unsigned attribute); void Id (unsigned attribute); void Iv (unsigned attribute); #if BX_DISASM_SUPPORT_X86_64 void Iz (unsigned attribute); void Iq (unsigned attribute); #endif // general purpose register or memory void Eb (unsigned attribute); void Ew (unsigned attribute); void Ed (unsigned attribute); void Ev (unsigned attribute); // general purpose register void Gb (unsigned attribute); void Gv (unsigned attribute); void Gd (unsigned attribute); // call/jump void Jb (unsigned attribute); void Jv (unsigned attribute); // call/jmp far void Ap (unsigned attribute); }; #endif