| #include "ia32_modrm.h" |
| #include "ia32_reg.h" |
| #include "x86_imm.h" |
| |
| /* NOTE: when decoding ModR/M and SIB, we have to add 1 to all register |
| * values obtained from decoding the ModR/M or SIB byte, since they |
| * are encoded with eAX = 0 and the tables in ia32_reg.c use eAX = 1. |
| * ADDENDUM: this is only the case when the register value is used |
| * directly as an index into the register table, not when it is added to |
| * a genregs offset. */ |
| |
| /* -------------------------------- ModR/M, SIB */ |
| /* ModR/M flags */ |
| #define MODRM_RM_SIB 0x04 /* R/M == 100 */ |
| #define MODRM_RM_NOREG 0x05 /* R/B == 101 */ |
| |
| /* if (MODRM.MOD_NODISP && MODRM.RM_NOREG) then just disp32 */ |
| #define MODRM_MOD_NODISP 0x00 /* mod == 00 */ |
| #define MODRM_MOD_DISP8 0x01 /* mod == 01 */ |
| #define MODRM_MOD_DISP32 0x02 /* mod == 10 */ |
| #define MODRM_MOD_NOEA 0x03 /* mod == 11 */ |
| |
| /* 16-bit modrm flags */ |
| #define MOD16_MOD_NODISP 0 |
| #define MOD16_MOD_DISP8 1 |
| #define MOD16_MOD_DISP16 2 |
| #define MOD16_MOD_REG 3 |
| |
| #define MOD16_RM_BXSI 0 |
| #define MOD16_RM_BXDI 1 |
| #define MOD16_RM_BPSI 2 |
| #define MOD16_RM_BPDI 3 |
| #define MOD16_RM_SI 4 |
| #define MOD16_RM_DI 5 |
| #define MOD16_RM_BP 6 |
| #define MOD16_RM_BX 7 |
| |
| /* SIB flags */ |
| #define SIB_INDEX_NONE 0x04 |
| #define SIB_BASE_EBP 0x05 |
| #define SIB_SCALE_NOBASE 0x00 |
| |
| /* Convenience struct for modR/M bitfield */ |
| struct modRM_byte { |
| unsigned int mod : 2; |
| unsigned int reg : 3; |
| unsigned int rm : 3; |
| }; |
| |
| /* Convenience struct for SIB bitfield */ |
| struct SIB_byte { |
| unsigned int scale : 2; |
| unsigned int index : 3; |
| unsigned int base : 3; |
| }; |
| |
| |
| #if 0 |
| int modrm_rm[] = {0,1,2,3,MODRM_RM_SIB,MODRM_MOD_DISP32,6,7}; |
| int modrm_reg[] = {0, 1, 2, 3, 4, 5, 6, 7}; |
| int modrm_mod[] = {0, MODRM_MOD_DISP8, MODRM_MOD_DISP32, MODRM_MOD_NOEA}; |
| int sib_scl[] = {0, 2, 4, 8}; |
| int sib_idx[] = {0, 1, 2, 3, SIB_INDEX_NONE, 5, 6, 7 }; |
| int sib_bas[] = {0, 1, 2, 3, 4, SIB_SCALE_NOBASE, 6, 7 }; |
| #endif |
| |
| /* this is needed to replace x86_imm_signsized() which does not sign-extend |
| * to dest */ |
| static unsigned int imm32_signsized( unsigned char *buf, size_t buf_len, |
| int32_t *dest, unsigned int size ) { |
| if ( size > buf_len ) { |
| return 0; |
| } |
| |
| switch (size) { |
| case 1: |
| *dest = *((signed char *) buf); |
| break; |
| case 2: |
| *dest = *((signed short *) buf); |
| break; |
| case 4: |
| default: |
| *dest = *((signed int *) buf); |
| break; |
| } |
| |
| return size; |
| } |
| |
| |
| |
| static void byte_decode(unsigned char b, struct modRM_byte *modrm) { |
| /* generic bitfield-packing routine */ |
| |
| modrm->mod = b >> 6; /* top 2 bits */ |
| modrm->reg = (b & 56) >> 3; /* middle 3 bits */ |
| modrm->rm = b & 7; /* bottom 3 bits */ |
| } |
| |
| |
| static size_t sib_decode( unsigned char *buf, size_t buf_len, x86_ea_t *ea, |
| unsigned int mod ) { |
| /* set Address Expression fields (scale, index, base, disp) |
| * according to the contents of the SIB byte. |
| * b points to the SIB byte in the instruction-stream buffer; the |
| * byte after b[0] is therefore the byte after the SIB |
| * returns number of bytes 'used', including the SIB byte */ |
| size_t size = 1; /* start at 1 for SIB byte */ |
| struct SIB_byte sib; |
| |
| if ( buf_len < 1 ) { |
| return 0; |
| } |
| |
| byte_decode( *buf, (struct modRM_byte *)(void*)&sib ); /* get bit-fields */ |
| |
| if ( sib.base == SIB_BASE_EBP && ! mod ) { /* if base == 101 (ebp) */ |
| /* IF BASE == EBP, deal with exception */ |
| /* IF (ModR/M did not create a Disp */ |
| /* ... create a 32-bit Displacement */ |
| imm32_signsized( &buf[1], buf_len, &ea->disp, sizeof(int32_t)); |
| ea->disp_size = sizeof(int32_t); |
| ea->disp_sign = (ea->disp < 0) ? 1 : 0; |
| size += 4; /* add sizeof disp to count */ |
| |
| } else { |
| /* ELSE BASE refers to a General Register */ |
| ia32_handle_register( &ea->base, sib.base + 1 ); |
| } |
| |
| /* set scale to 1, 2, 4, 8 */ |
| ea->scale = 1 << sib.scale; |
| |
| if (sib.index != SIB_INDEX_NONE) { |
| /* IF INDEX is not 'ESP' (100) */ |
| ia32_handle_register( &ea->index, sib.index + 1 ); |
| } |
| |
| return (size); /* return number of bytes processed */ |
| } |
| |
| static size_t modrm_decode16( unsigned char *buf, unsigned int buf_len, |
| x86_op_t *op, struct modRM_byte *modrm ) { |
| /* 16-bit mode: hackish, but not as hackish as 32-bit mode ;) */ |
| size_t size = 1; /* # of bytes decoded [1 for modR/M byte] */ |
| x86_ea_t * ea = &op->data.expression; |
| |
| switch( modrm->rm ) { |
| case MOD16_RM_BXSI: |
| ia32_handle_register(&ea->base, REG_WORD_OFFSET + 3); |
| ia32_handle_register(&ea->index, REG_WORD_OFFSET + 6); |
| break; |
| case MOD16_RM_BXDI: |
| ia32_handle_register(&ea->base, REG_WORD_OFFSET + 3); |
| ia32_handle_register(&ea->index, REG_WORD_OFFSET + 7); |
| case MOD16_RM_BPSI: |
| op->flags |= op_ss_seg; |
| ia32_handle_register(&ea->base, REG_WORD_OFFSET + 5); |
| ia32_handle_register(&ea->index, REG_WORD_OFFSET + 6); |
| break; |
| case MOD16_RM_BPDI: |
| op->flags |= op_ss_seg; |
| ia32_handle_register(&ea->base, REG_WORD_OFFSET + 5); |
| ia32_handle_register(&ea->index, REG_WORD_OFFSET + 7); |
| break; |
| case MOD16_RM_SI: |
| ia32_handle_register(&ea->base, REG_WORD_OFFSET + 6); |
| break; |
| case MOD16_RM_DI: |
| ia32_handle_register(&ea->base, REG_WORD_OFFSET + 7); |
| break; |
| case MOD16_RM_BP: |
| if ( modrm->mod != MOD16_MOD_NODISP ) { |
| op->flags |= op_ss_seg; |
| ia32_handle_register(&ea->base, |
| REG_WORD_OFFSET + 5); |
| } |
| break; |
| case MOD16_RM_BX: |
| ia32_handle_register(&ea->base, REG_WORD_OFFSET + 3); |
| break; |
| } |
| |
| /* move to byte after ModR/M */ |
| ++buf; |
| --buf_len; |
| |
| if ( modrm->mod == MOD16_MOD_DISP8 ) { |
| imm32_signsized( buf, buf_len, &ea->disp, sizeof(char) ); |
| ea->disp_sign = (ea->disp < 0) ? 1 : 0; |
| ea->disp_size = sizeof(char); |
| size += sizeof(char); |
| } else if ( modrm->mod == MOD16_MOD_DISP16 ) { |
| imm32_signsized( buf, buf_len, &ea->disp, sizeof(short) ); |
| ea->disp_sign = (ea->disp < 0) ? 1 : 0; |
| ea->disp_size = sizeof(short); |
| size += sizeof(short); |
| } |
| |
| return size; |
| } |
| |
| /* TODO : Mark index modes |
| Use addressing mode flags to imply arrays (index), structure (disp), |
| two-dimensional arrays [disp + index], classes [ea reg], and so on. |
| */ |
| size_t ia32_modrm_decode( unsigned char *buf, unsigned int buf_len, |
| x86_op_t *op, x86_insn_t *insn, size_t gen_regs ) { |
| /* create address expression and/or fill operand based on value of |
| * ModR/M byte. Calls sib_decode as appropriate. |
| * flags specifies whether Reg or mod+R/M fields are being decoded |
| * returns the number of bytes in the instruction, including modR/M */ |
| struct modRM_byte modrm; |
| size_t size = 1; /* # of bytes decoded [1 for modR/M byte] */ |
| x86_ea_t * ea; |
| |
| |
| byte_decode(*buf, &modrm); /* get bitfields */ |
| |
| /* first, handle the case where the mod field is a register only */ |
| if ( modrm.mod == MODRM_MOD_NOEA ) { |
| op->type = op_register; |
| ia32_handle_register(&op->data.reg, modrm.rm + gen_regs); |
| /* increase insn size by 1 for modrm byte */ |
| return 1; |
| } |
| |
| /* then deal with cases where there is an effective address */ |
| ea = &op->data.expression; |
| op->type = op_expression; |
| op->flags |= op_pointer; |
| |
| if ( insn->addr_size == 2 ) { |
| /* gah! 16 bit mode! */ |
| return modrm_decode16( buf, buf_len, op, &modrm); |
| } |
| |
| /* move to byte after ModR/M */ |
| ++buf; |
| --buf_len; |
| |
| if (modrm.mod == MODRM_MOD_NODISP) { /* if mod == 00 */ |
| |
| /* IF MOD == No displacement, just Indirect Register */ |
| if (modrm.rm == MODRM_RM_NOREG) { /* if r/m == 101 */ |
| /* IF RM == No Register, just Displacement */ |
| /* This is an Intel Moronic Exception TM */ |
| imm32_signsized( buf, buf_len, &ea->disp, |
| sizeof(int32_t) ); |
| ea->disp_size = sizeof(int32_t); |
| ea->disp_sign = (ea->disp < 0) ? 1 : 0; |
| size += 4; /* add sizeof disp to count */ |
| |
| } else if (modrm.rm == MODRM_RM_SIB) { /* if r/m == 100 */ |
| /* ELSE IF an SIB byte is present */ |
| /* TODO: check for 0 retval */ |
| size += sib_decode( buf, buf_len, ea, modrm.mod); |
| /* move to byte after SIB for displacement */ |
| ++buf; |
| --buf_len; |
| } else { /* modR/M specifies base register */ |
| /* ELSE RM encodes a general register */ |
| ia32_handle_register( &ea->base, modrm.rm + 1 ); |
| } |
| } else { /* mod is 01 or 10 */ |
| if (modrm.rm == MODRM_RM_SIB) { /* rm == 100 */ |
| /* IF base is an AddrExpr specified by an SIB byte */ |
| /* TODO: check for 0 retval */ |
| size += sib_decode( buf, buf_len, ea, modrm.mod); |
| /* move to byte after SIB for displacement */ |
| ++buf; |
| --buf_len; |
| } else { |
| /* ELSE base is a general register */ |
| ia32_handle_register( &ea->base, modrm.rm + 1 ); |
| } |
| |
| /* ELSE mod + r/m specify a disp##[base] or disp##(SIB) */ |
| if (modrm.mod == MODRM_MOD_DISP8) { /* mod == 01 */ |
| /* If this is an 8-bit displacement */ |
| imm32_signsized( buf, buf_len, &ea->disp, |
| sizeof(char)); |
| ea->disp_size = sizeof(char); |
| ea->disp_sign = (ea->disp < 0) ? 1 : 0; |
| size += 1; /* add sizeof disp to count */ |
| |
| } else { |
| /* Displacement is dependent on address size */ |
| imm32_signsized( buf, buf_len, &ea->disp, |
| insn->addr_size); |
| ea->disp_size = insn->addr_size; |
| ea->disp_sign = (ea->disp < 0) ? 1 : 0; |
| size += 4; |
| } |
| } |
| |
| return size; /* number of bytes found in instruction */ |
| } |
| |
| void ia32_reg_decode( unsigned char byte, x86_op_t *op, size_t gen_regs ) { |
| struct modRM_byte modrm; |
| byte_decode( byte, &modrm ); /* get bitfields */ |
| |
| /* set operand to register ID */ |
| op->type = op_register; |
| ia32_handle_register(&op->data.reg, modrm.reg + gen_regs); |
| |
| return; |
| } |