mirror of
https://github.com/TomHarte/CLK.git
synced 2025-08-08 14:25:05 +00:00
Muddles drunkenly towards decoding ModRM.
This commit is contained in:
@@ -8,26 +8,27 @@
|
|||||||
|
|
||||||
#include "x86.hpp"
|
#include "x86.hpp"
|
||||||
|
|
||||||
|
#include <cassert>
|
||||||
|
|
||||||
using namespace CPU::Decoder::x86;
|
using namespace CPU::Decoder::x86;
|
||||||
|
|
||||||
Instruction Decoder::decode(uint8_t *source, size_t length) {
|
Instruction Decoder::decode(uint8_t *source, size_t length) {
|
||||||
uint8_t *const limit = source + length;
|
uint8_t *const limit = source + length;
|
||||||
|
|
||||||
#define MapPartial(value, op, sz, fmt, phs) \
|
#define MapPartial(value, op, lrg, fmt, phs) \
|
||||||
case value: \
|
case value: \
|
||||||
operation_ = Operation::op; \
|
operation_ = Operation::op; \
|
||||||
operand_size_ = Size::sz; \
|
large_operand_ = lrg; \
|
||||||
format_ = Format::fmt; \
|
format_ = Format::fmt; \
|
||||||
phase_ = Phase::phs; \
|
phase_ = Phase::phs; \
|
||||||
break
|
break
|
||||||
|
|
||||||
#define MapComplete(value, op, sz, src, dest) \
|
#define MapComplete(value, op, src, dest) \
|
||||||
case value: \
|
case value: \
|
||||||
operation_ = Operation::op; \
|
operation_ = Operation::op; \
|
||||||
operand_size_ = Size::sz; \
|
source_ = Source::src; \
|
||||||
source_ = Source::src; \
|
destination_ = Source::dest; \
|
||||||
destination_ = Source::dest; \
|
phase_ = Phase::ReadyToPost; \
|
||||||
phase_ = Phase::ReadyToPost; \
|
|
||||||
break
|
break
|
||||||
|
|
||||||
while(phase_ == Phase::Instruction && source != limit) {
|
while(phase_ == Phase::Instruction && source != limit) {
|
||||||
@@ -36,56 +37,56 @@ Instruction Decoder::decode(uint8_t *source, size_t length) {
|
|||||||
instr_ = *source;
|
instr_ = *source;
|
||||||
switch(instr_) {
|
switch(instr_) {
|
||||||
#define PartialBlock(start, operation) \
|
#define PartialBlock(start, operation) \
|
||||||
MapPartial(start + 0x00, operation, Byte, MemReg_Reg, ModRM); \
|
MapPartial(start + 0x00, operation, false, MemReg_Reg, ModRM); \
|
||||||
MapPartial(start + 0x01, operation, Word, MemReg_Reg, ModRM); \
|
MapPartial(start + 0x01, operation, true, MemReg_Reg, ModRM); \
|
||||||
MapPartial(start + 0x02, operation, Byte, Reg_MemReg, ModRM); \
|
MapPartial(start + 0x02, operation, false, Reg_MemReg, ModRM); \
|
||||||
MapPartial(start + 0x03, operation, Word, Reg_MemReg, ModRM); \
|
MapPartial(start + 0x03, operation, true, Reg_MemReg, ModRM); \
|
||||||
MapPartial(start + 0x04, operation, Byte, Ac_Data, AwaitingOperands); \
|
MapPartial(start + 0x04, operation, false, Ac_Data, AwaitingOperands); \
|
||||||
MapPartial(start + 0x05, operation, Word, Ac_Data, AwaitingOperands);
|
MapPartial(start + 0x05, operation, true, Ac_Data, AwaitingOperands);
|
||||||
|
|
||||||
PartialBlock(0x00, ADD);
|
PartialBlock(0x00, ADD);
|
||||||
MapComplete(0x06, PUSH, Word, ES, None);
|
MapComplete(0x06, PUSH, ES, None);
|
||||||
MapComplete(0x07, POP, Word, ES, None);
|
MapComplete(0x07, POP, ES, None);
|
||||||
|
|
||||||
PartialBlock(0x08, OR);
|
PartialBlock(0x08, OR);
|
||||||
MapComplete(0x0e, PUSH, Word, CS, None);
|
MapComplete(0x0e, PUSH, CS, None);
|
||||||
/* 0x0f: not used. */
|
/* 0x0f: not used. */
|
||||||
|
|
||||||
PartialBlock(0x10, ADC);
|
PartialBlock(0x10, ADC);
|
||||||
MapComplete(0x16, PUSH, Word, SS, None);
|
MapComplete(0x16, PUSH, SS, None);
|
||||||
MapComplete(0x17, POP, Word, SS, None);
|
MapComplete(0x17, POP, SS, None);
|
||||||
|
|
||||||
PartialBlock(0x18, SBB);
|
PartialBlock(0x18, SBB);
|
||||||
MapComplete(0x1e, PUSH, Word, DS, None);
|
MapComplete(0x1e, PUSH, DS, None);
|
||||||
MapComplete(0x1f, POP, Word, DS, None);
|
MapComplete(0x1f, POP, DS, None);
|
||||||
|
|
||||||
PartialBlock(0x20, AND);
|
PartialBlock(0x20, AND);
|
||||||
case 0x26: segment_override_ = Source::ES; break;
|
case 0x26: segment_override_ = Source::ES; break;
|
||||||
MapComplete(0x27, DAA, Implied, None, None);
|
MapComplete(0x27, DAA, None, None);
|
||||||
|
|
||||||
PartialBlock(0x28, SUB);
|
PartialBlock(0x28, SUB);
|
||||||
case 0x2e: segment_override_ = Source::CS; break;
|
case 0x2e: segment_override_ = Source::CS; break;
|
||||||
MapComplete(0x2f, DAS, Implied, None, None);
|
MapComplete(0x2f, DAS, None, None);
|
||||||
|
|
||||||
PartialBlock(0x30, XOR);
|
PartialBlock(0x30, XOR);
|
||||||
case 0x36: segment_override_ = Source::SS; break;
|
case 0x36: segment_override_ = Source::SS; break;
|
||||||
MapComplete(0x37, AAA, Implied, None, None);
|
MapComplete(0x37, AAA, None, None);
|
||||||
|
|
||||||
PartialBlock(0x38, CMP);
|
PartialBlock(0x38, CMP);
|
||||||
case 0x3e: segment_override_ = Source::DS; break;
|
case 0x3e: segment_override_ = Source::DS; break;
|
||||||
MapComplete(0x3f, AAS, Implied, None, None);
|
MapComplete(0x3f, AAS, None, None);
|
||||||
|
|
||||||
#undef PartialBlock
|
#undef PartialBlock
|
||||||
|
|
||||||
#define RegisterBlock(start, operation) \
|
#define RegisterBlock(start, operation) \
|
||||||
MapComplete(start + 0x00, operation, Word, AX, AX); \
|
MapComplete(start + 0x00, operation, AX, AX); \
|
||||||
MapComplete(start + 0x01, operation, Word, CX, CX); \
|
MapComplete(start + 0x01, operation, CX, CX); \
|
||||||
MapComplete(start + 0x02, operation, Word, DX, DX); \
|
MapComplete(start + 0x02, operation, DX, DX); \
|
||||||
MapComplete(start + 0x03, operation, Word, BX, BX); \
|
MapComplete(start + 0x03, operation, BX, BX); \
|
||||||
MapComplete(start + 0x04, operation, Word, SP, SP); \
|
MapComplete(start + 0x04, operation, SP, SP); \
|
||||||
MapComplete(start + 0x05, operation, Word, BP, BP); \
|
MapComplete(start + 0x05, operation, BP, BP); \
|
||||||
MapComplete(start + 0x06, operation, Word, SI, SI); \
|
MapComplete(start + 0x06, operation, SI, SI); \
|
||||||
MapComplete(start + 0x07, operation, Word, DI, DI); \
|
MapComplete(start + 0x07, operation, DI, DI); \
|
||||||
|
|
||||||
RegisterBlock(0x40, INC);
|
RegisterBlock(0x40, INC);
|
||||||
RegisterBlock(0x48, DEC);
|
RegisterBlock(0x48, DEC);
|
||||||
@@ -96,59 +97,68 @@ Instruction Decoder::decode(uint8_t *source, size_t length) {
|
|||||||
|
|
||||||
/* 0x60–0x6f: not used. */
|
/* 0x60–0x6f: not used. */
|
||||||
|
|
||||||
MapPartial(0x70, JO, Byte, Disp, AwaitingOperands);
|
#define MapJump(value, operation) MapPartial(value, operation, false, Disp, AwaitingOperands);
|
||||||
MapPartial(0x71, JNO, Byte, Disp, AwaitingOperands);
|
MapJump(0x70, JO);
|
||||||
MapPartial(0x72, JB, Byte, Disp, AwaitingOperands);
|
MapJump(0x71, JNO);
|
||||||
MapPartial(0x73, JNB, Byte, Disp, AwaitingOperands);
|
MapJump(0x72, JB);
|
||||||
MapPartial(0x74, JE, Byte, Disp, AwaitingOperands);
|
MapJump(0x73, JNB);
|
||||||
MapPartial(0x75, JNE, Byte, Disp, AwaitingOperands);
|
MapJump(0x74, JE);
|
||||||
MapPartial(0x76, JBE, Byte, Disp, AwaitingOperands);
|
MapJump(0x75, JNE);
|
||||||
MapPartial(0x77, JNBE, Byte, Disp, AwaitingOperands);
|
MapJump(0x76, JBE);
|
||||||
MapPartial(0x78, JS, Byte, Disp, AwaitingOperands);
|
MapJump(0x77, JNBE);
|
||||||
MapPartial(0x79, JNS, Byte, Disp, AwaitingOperands);
|
MapJump(0x78, JS);
|
||||||
MapPartial(0x7a, JP, Byte, Disp, AwaitingOperands);
|
MapJump(0x79, JNS);
|
||||||
MapPartial(0x7b, JNP, Byte, Disp, AwaitingOperands);
|
MapJump(0x7a, JP);
|
||||||
MapPartial(0x7c, JL, Byte, Disp, AwaitingOperands);
|
MapJump(0x7b, JNP);
|
||||||
MapPartial(0x7d, JNL, Byte, Disp, AwaitingOperands);
|
MapJump(0x7c, JL);
|
||||||
MapPartial(0x7e, JLE, Byte, Disp, AwaitingOperands);
|
MapJump(0x7d, JNL);
|
||||||
MapPartial(0x7f, JNLE, Byte, Disp, AwaitingOperands);
|
MapJump(0x7e, JLE);
|
||||||
|
MapJump(0x7f, JNLE);
|
||||||
|
#undef MapJump
|
||||||
|
|
||||||
// TODO:
|
// TODO:
|
||||||
//
|
//
|
||||||
// 0x80, 0x81, 0x82, 0x83, which all require more
|
// 0x80, 0x81, 0x82, 0x83, which all require more
|
||||||
// input, from the ModRM byte.
|
// input, from the ModRM byte.
|
||||||
|
|
||||||
MapPartial(0x84, TEST, Byte, MemReg_Reg, ModRM);
|
MapPartial(0x84, TEST, false, MemReg_Reg, ModRM);
|
||||||
MapPartial(0x85, TEST, Word, MemReg_Reg, ModRM);
|
MapPartial(0x85, TEST, true, MemReg_Reg, ModRM);
|
||||||
MapPartial(0x86, XCHG, Byte, Reg_MemReg, ModRM);
|
MapPartial(0x86, XCHG, false, Reg_MemReg, ModRM);
|
||||||
MapPartial(0x87, XCHG, Word, Reg_MemReg, ModRM);
|
MapPartial(0x87, XCHG, true, Reg_MemReg, ModRM);
|
||||||
MapPartial(0x88, MOV, Byte, MemReg_Reg, ModRM);
|
MapPartial(0x88, MOV, false, MemReg_Reg, ModRM);
|
||||||
MapPartial(0x89, MOV, Word, MemReg_Reg, ModRM);
|
MapPartial(0x89, MOV, true, MemReg_Reg, ModRM);
|
||||||
MapPartial(0x8a, MOV, Byte, Reg_MemReg, ModRM);
|
MapPartial(0x8a, MOV, false, Reg_MemReg, ModRM);
|
||||||
MapPartial(0x8b, MOV, Word, Reg_MemReg, ModRM);
|
MapPartial(0x8b, MOV, true, Reg_MemReg, ModRM);
|
||||||
/* 0x8c: not used. */
|
/* 0x8c: not used. */
|
||||||
MapPartial(0x8d, LEA, Word, Reg_Addr, ModRM);
|
MapPartial(0x8d, LEA, true, Reg_Addr, ModRM);
|
||||||
MapPartial(0x8e, MOV, Word, SegReg_MemReg, ModRM);
|
MapPartial(0x8e, MOV, true, SegReg_MemReg, ModRM);
|
||||||
|
|
||||||
// TODO: 0x8f, which requires further selection from the ModRM byte.
|
// TODO: 0x8f, which requires further selection from the ModRM byte.
|
||||||
|
|
||||||
MapComplete(0x90, NOP, Implied, None, None); // Or XCHG AX, AX?
|
MapComplete(0x90, NOP, None, None); // Or XCHG AX, AX?
|
||||||
MapComplete(0x91, XCHG, Word, AX, CX);
|
MapComplete(0x91, XCHG, AX, CX);
|
||||||
MapComplete(0x92, XCHG, Word, AX, DX);
|
MapComplete(0x92, XCHG, AX, DX);
|
||||||
MapComplete(0x93, XCHG, Word, AX, BX);
|
MapComplete(0x93, XCHG, AX, BX);
|
||||||
MapComplete(0x94, XCHG, Word, AX, SP);
|
MapComplete(0x94, XCHG, AX, SP);
|
||||||
MapComplete(0x95, XCHG, Word, AX, BP);
|
MapComplete(0x95, XCHG, AX, BP);
|
||||||
MapComplete(0x96, XCHG, Word, AX, SI);
|
MapComplete(0x96, XCHG, AX, SI);
|
||||||
MapComplete(0x97, XCHG, Word, AX, DI);
|
MapComplete(0x97, XCHG, AX, DI);
|
||||||
|
|
||||||
MapComplete(0x98, CBW, Implied, None, None);
|
MapComplete(0x98, CBW, None, None);
|
||||||
MapComplete(0x99, CWD, Implied, None, None);
|
MapComplete(0x99, CWD, None, None);
|
||||||
MapPartial(0x9a, CALL, Word, Disp, AwaitingOperands);
|
MapPartial(0x9a, CALL, true, Addr, AwaitingOperands);
|
||||||
MapComplete(0x9b, WAIT, Implied, None, None);
|
MapComplete(0x9b, WAIT, None, None);
|
||||||
MapComplete(0x9c, PUSHF, Implied, None, None);
|
MapComplete(0x9c, PUSHF, None, None);
|
||||||
MapComplete(0x9d, POPF, Implied, None, None);
|
MapComplete(0x9d, POPF, None, None);
|
||||||
MapComplete(0x9e, SAHF, Implied, None, None);
|
MapComplete(0x9e, SAHF, None, None);
|
||||||
MapComplete(0x9f, LAHF, Implied, None, None);
|
MapComplete(0x9f, LAHF, None, None);
|
||||||
|
|
||||||
|
MapPartial(0xa0, MOV, false, Reg_Addr, AwaitingOperands);
|
||||||
|
|
||||||
|
// Other prefix bytes.
|
||||||
|
case 0xf0: lock_ = true; break;
|
||||||
|
case 0xf2: repetition_ = Repetition::RepNE; break;
|
||||||
|
case 0xf3: repetition_ = Repetition::RepE; break;
|
||||||
}
|
}
|
||||||
++source;
|
++source;
|
||||||
++consumed_;
|
++consumed_;
|
||||||
@@ -156,6 +166,74 @@ Instruction Decoder::decode(uint8_t *source, size_t length) {
|
|||||||
|
|
||||||
#undef MapInstr
|
#undef MapInstr
|
||||||
|
|
||||||
|
if(phase_ == Phase::ModRM && source != limit) {
|
||||||
|
const uint8_t mod = *source >> 6; // i.e. mode.
|
||||||
|
const uint8_t reg = (*source >> 3) & 7; // i.e. register.
|
||||||
|
const uint8_t rm = *source & 7; // i.e. register/memory.
|
||||||
|
|
||||||
|
switch(format_) {
|
||||||
|
case Format::Reg_MemReg:
|
||||||
|
case Format::MemReg_Reg: {
|
||||||
|
Source memreg;
|
||||||
|
|
||||||
|
constexpr Source reg_table[2][8] = {
|
||||||
|
{
|
||||||
|
Source::AL, Source::CL, Source::DL, Source::BL,
|
||||||
|
Source::AH, Source::CH, Source::DH, Source::BH,
|
||||||
|
}, {
|
||||||
|
Source::AX, Source::CX, Source::DX, Source::BX,
|
||||||
|
Source::SP, Source::BP, Source::SI, Source::DI,
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
switch(mod) {
|
||||||
|
case 0: {
|
||||||
|
add_offset_ = false;
|
||||||
|
constexpr Source rm_table[8] = {
|
||||||
|
Source::IndBXPlusSI, Source::IndBXPlusDI,
|
||||||
|
Source::IndBPPlusSI, Source::IndBPPlusDI,
|
||||||
|
Source::IndSI, Source::IndDI,
|
||||||
|
Source::DirectAddress, Source::IndBX,
|
||||||
|
};
|
||||||
|
memreg = rm_table[rm];
|
||||||
|
} break;
|
||||||
|
|
||||||
|
default: {
|
||||||
|
add_offset_ = true;
|
||||||
|
large_offset_ = (mod == 2);
|
||||||
|
constexpr Source rm_table[8] = {
|
||||||
|
Source::IndBXPlusSI, Source::IndBXPlusDI,
|
||||||
|
Source::IndBPPlusSI, Source::IndBPPlusDI,
|
||||||
|
Source::IndSI, Source::IndDI,
|
||||||
|
Source::IndBP, Source::IndBX,
|
||||||
|
};
|
||||||
|
memreg = rm_table[rm];
|
||||||
|
} break;
|
||||||
|
|
||||||
|
// Other operand is just a register.
|
||||||
|
case 3: memreg = reg_table[large_operand_][rm]; break;
|
||||||
|
}
|
||||||
|
|
||||||
|
if(format_ == Format::Reg_MemReg) {
|
||||||
|
destination_ = reg_table[large_operand_][reg];
|
||||||
|
source_ = memreg;
|
||||||
|
} else {
|
||||||
|
source_ = reg_table[large_operand_][reg];
|
||||||
|
destination_ = memreg;
|
||||||
|
}
|
||||||
|
phase_ = (add_offset_ || memreg == Source::DirectAddress) ? Phase::AwaitingOperands : Phase::ReadyToPost;
|
||||||
|
} break;
|
||||||
|
|
||||||
|
default: assert(false);
|
||||||
|
}
|
||||||
|
|
||||||
|
++source;
|
||||||
|
++consumed_;
|
||||||
|
}
|
||||||
|
|
||||||
|
if(phase_ == Phase::AwaitingOperands && source != limit) {
|
||||||
|
// TODO: calculate number of expected operands.
|
||||||
|
}
|
||||||
|
|
||||||
if(phase_ == Phase::ReadyToPost) {
|
if(phase_ == Phase::ReadyToPost) {
|
||||||
// TODO: construct actual Instruction.
|
// TODO: construct actual Instruction.
|
||||||
|
@@ -46,6 +46,7 @@ enum class Size: uint8_t {
|
|||||||
Implied = 0,
|
Implied = 0,
|
||||||
Byte = 1,
|
Byte = 1,
|
||||||
Word = 2,
|
Word = 2,
|
||||||
|
DWord = 4,
|
||||||
};
|
};
|
||||||
|
|
||||||
enum class Source: uint8_t {
|
enum class Source: uint8_t {
|
||||||
@@ -60,7 +61,17 @@ enum class Source: uint8_t {
|
|||||||
SI, DI,
|
SI, DI,
|
||||||
BP, SP,
|
BP, SP,
|
||||||
|
|
||||||
Memory, Immediate
|
IndBXPlusSI,
|
||||||
|
IndBXPlusDI,
|
||||||
|
IndBPPlusSI,
|
||||||
|
IndBPPlusDI,
|
||||||
|
IndSI,
|
||||||
|
IndDI,
|
||||||
|
DirectAddress,
|
||||||
|
IndBP,
|
||||||
|
IndBX,
|
||||||
|
|
||||||
|
Immediate
|
||||||
};
|
};
|
||||||
|
|
||||||
class Instruction {
|
class Instruction {
|
||||||
@@ -111,16 +122,28 @@ struct Decoder {
|
|||||||
MemReg_Data,
|
MemReg_Data,
|
||||||
SegReg_MemReg,
|
SegReg_MemReg,
|
||||||
Reg_Addr,
|
Reg_Addr,
|
||||||
Disp
|
Addr_Reg,
|
||||||
|
Disp,
|
||||||
|
Addr
|
||||||
} format_ = Format::MemReg_Reg;
|
} format_ = Format::MemReg_Reg;
|
||||||
|
// TODO: figure out which Formats can be folded together,
|
||||||
|
// and which are improperly elided.
|
||||||
|
|
||||||
|
enum class Repetition: uint8_t {
|
||||||
|
None, RepE, RepNE
|
||||||
|
} repetition_ = Repetition::None;
|
||||||
|
|
||||||
|
|
||||||
int consumed_ = 0;
|
int consumed_ = 0;
|
||||||
Operation operation_ = Operation::Invalid;
|
Operation operation_ = Operation::Invalid;
|
||||||
Size operand_size_ = Size::Implied;
|
bool large_operand_ = false;
|
||||||
Source source_ = Source::None;
|
Source source_ = Source::None;
|
||||||
Source destination_ = Source::None;
|
Source destination_ = Source::None;
|
||||||
Source segment_override_ = Source::None;
|
Source segment_override_ = Source::None;
|
||||||
uint8_t instr_ = 0x00;
|
uint8_t instr_ = 0x00;
|
||||||
|
bool lock_ = false;
|
||||||
|
bool add_offset_ = false;
|
||||||
|
bool large_offset_ = false;
|
||||||
};
|
};
|
||||||
|
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user