1
0
mirror of https://github.com/TomHarte/CLK.git synced 2024-12-01 11:49:58 +00:00
CLK/OSBindings/Mac/Clock SignalTests/x86DecoderTests.mm
2023-10-27 12:54:42 -04:00

683 lines
27 KiB
Plaintext

//
// x86DecoderTests.m
// Clock Signal
//
// Created by Thomas Harte on 03/01/2021.
// Copyright 2021 Thomas Harte. All rights reserved.
//
#import <XCTest/XCTest.h>
#include <initializer_list>
#include <optional>
#include <vector>
#include "../../../InstructionSets/x86/Decoder.hpp"
using namespace InstructionSet::x86;
namespace {
// MARK: - Specific instruction asserts.
template <typename InstructionT> void test(const InstructionT &instruction, DataSize size, Operation operation) {
XCTAssertEqual(instruction.operation_size(), InstructionSet::x86::DataSize(size));
XCTAssertEqual(instruction.operation(), operation);
}
template <typename InstructionT> void test(
const InstructionT &instruction,
DataSize size,
Operation operation,
std::optional<InstructionSet::x86::DataPointer> source,
std::optional<InstructionSet::x86::DataPointer> destination = std::nullopt,
std::optional<typename InstructionT::ImmediateT> operand = std::nullopt,
std::optional<typename InstructionT::DisplacementT> displacement = std::nullopt) {
XCTAssertEqual(instruction.operation_size(), InstructionSet::x86::DataSize(size));
XCTAssertEqual(instruction.operation(), operation);
if(source) XCTAssert(instruction.source() == *source);
if(destination) XCTAssert(instruction.destination() == *destination);
if(operand) XCTAssertEqual(instruction.operand(), *operand);
if(displacement) XCTAssertEqual(instruction.displacement(), *displacement);
}
template <typename InstructionT> void test(
const InstructionT &instruction,
Operation operation,
std::optional<typename InstructionT::ImmediateT> operand = std::nullopt,
std::optional<typename InstructionT::DisplacementT> displacement = std::nullopt) {
XCTAssertEqual(instruction.operation(), operation);
if(operand) XCTAssertEqual(instruction.operand(), *operand);
if(displacement) XCTAssertEqual(instruction.displacement(), *displacement);
}
template <typename InstructionT> void test_far(
const InstructionT &instruction,
Operation operation,
uint16_t segment,
typename InstructionT::DisplacementT offset) {
XCTAssertEqual(instruction.operation(), operation);
XCTAssertEqual(instruction.segment(), segment);
XCTAssertEqual(instruction.offset(), offset);
}
// MARK: - Decoder
template <Model model, typename CollectionT>
std::vector<typename InstructionSet::x86::Decoder<model>::InstructionT>
decode(const CollectionT &stream, bool set_32_bit = false) {
// Build instructions list with a byte-by-byte decoding.
std::vector<typename InstructionSet::x86::Decoder<model>::InstructionT> instructions;
InstructionSet::x86::Decoder<model> decoder;
decoder.set_32bit_protected_mode(set_32_bit);
for(uint8_t item: stream) {
const auto [size, next] = decoder.decode(&item, 1);
if(size > 0) {
instructions.push_back(next);
}
}
return instructions;
}
template <Model model>
std::vector<typename InstructionSet::x86::Decoder<model>::InstructionT>
decode(const std::initializer_list<uint8_t> &stream, bool set_32_bit = false) {
// Decode by offering up all data at once.
std::vector<typename InstructionSet::x86::Decoder<model>::InstructionT> instructions;
InstructionSet::x86::Decoder<model> decoder;
decoder.set_32bit_protected_mode(set_32_bit);
instructions.clear();
const uint8_t *byte = stream.begin();
while(byte != stream.end()) {
const auto [size, next] = decoder.decode(byte, stream.end() - byte);
if(size <= 0) break;
instructions.push_back(next);
byte += size;
}
// Grab a byte-at-a-time decoding and check that it matches the previous.
const auto byte_instructions = decode<model>(std::vector<uint8_t>{stream}, set_32_bit);
XCTAssertEqual(byte_instructions.size(), instructions.size());
auto previous_instruction = instructions.begin();
auto byte_instruction = byte_instructions.begin();
while(previous_instruction != instructions.end()) {
XCTAssert(*previous_instruction == *byte_instruction);
++previous_instruction;
++byte_instruction;
}
return instructions;
}
}
@interface x86DecoderTests : XCTestCase
@end
/*!
Tests 8086 decoding by throwing a bunch of randomly-generated
word streams and checking that the result matches what I got from a
disassembler elsewhere.
*/
@implementation x86DecoderTests
- (void)test16BitSequence {
// Sequences the Online Disassembler believes to exist but The 8086 Book does not:
//
// 0x6a 0x65 push $65
// 0x65 0x6d gs insw (%dx),%es:(%di)
// 0x67 0x61 addr32 popa
// 0x6c insb (%dx), %es:(%di)
// 0xc9 leave
//
const auto instructions = decode<Model::i8086>({
0x2d, 0x77, 0xea, 0x72, 0xfc, 0x4b, 0xb5, 0x28, 0xc3, 0xca, 0x26, 0x48, /* 0x65, 0x6d, */ 0x7b, 0x9f,
0xc2, 0x65, 0x42, 0x4e, 0xef, 0x70, 0x20, 0x94, 0xc4, 0xd4, 0x93, 0x43, 0x3c, 0x8e, /* 0x6a, 0x65, */
0x1a, 0x78, 0x45, 0x10, 0x7f, 0x3c, 0x19, 0x5a, 0x16, 0x31, 0x64, 0x2c, 0xe7, 0xc6, 0x7d, 0xb0,
0xb5, 0x49, /* 0x67, 0x61, */ 0xba, 0xc0, 0xcb, 0x14, 0x7e, 0x71, 0xd0, 0x50, 0x78, 0x3d, 0x03, 0x1d,
0xe5, 0xc9, 0x97, 0xc3, 0x9b, 0xe6, 0xd3, /* 0x6c, */ 0x58, 0x4d, 0x76, 0x80, 0x44, 0xd6, 0x9f, 0xa5,
0xbd, 0xa1, 0x12, 0xc5, 0x29, /* 0xc9, */ 0x9e, 0xd8, 0xf3, 0xcf, 0x92, 0x39, 0x5d, 0x90, 0x15, 0xc3,
0xb8, 0xad, 0xe8, 0xc8, 0x16, 0x4a, 0xb0, 0x9e, 0xf9, 0xbf, 0x56, 0xea, 0x4e, 0xfd, 0xe4, 0x5a,
0x23, 0xaa, 0x2c, 0x5b, 0x2a, 0xd2, 0xf7, 0x5f, 0x18, 0x86, 0x90, 0x25, 0x64, 0xb7, 0xc3
});
// 63 instructions are expected.
XCTAssertEqual(instructions.size(), 63);
// sub $0xea77,%ax
// jb 0x00000001
// dec %bx
// mov $0x28,%ch
test(instructions[0], DataSize::Word, Operation::SUB, Source::Immediate, Source::eAX, 0xea77);
test(instructions[1], Operation::JB, std::nullopt, 0xfffc);
test(instructions[2], DataSize::Word, Operation::DEC, Source::eBX, Source::eBX);
test(instructions[3], DataSize::Byte, Operation::MOV, Source::Immediate, Source::CH, 0x28);
// ret
// lret $0x4826
// [[ omitted: gs insw (%dx),%es:(%di) ]]
// jnp 0xffffffaf
// ret $0x4265
test(instructions[4], Operation::RETnear);
test(instructions[5], Operation::RETfar, 0x4826);
test(instructions[6], Operation::JNP, std::nullopt, 0xff9f);
test(instructions[7], Operation::RETnear, 0x4265);
// dec %si
// out %ax,(%dx)
// jo 0x00000037
// xchg %ax,%sp
test(instructions[8], DataSize::Word, Operation::DEC, Source::eSI, Source::eSI);
test(instructions[9], DataSize::Word, Operation::OUT, Source::eAX, Source::eDX);
test(instructions[10], Operation::JO, std::nullopt, 0x20);
test(instructions[11], DataSize::Word, Operation::XCHG, Source::eAX, Source::eSP);
// ODA has:
// c4 (bad)
// d4 93 aam $0x93
//
// That assumes that upon discovering that the d4 doesn't make a valid LES,
// it can become an instruction byte. I'm not persuaded. So I'm taking:
//
// c4 d4 (bad)
// 93 XCHG AX, BX
test(instructions[12], Operation::Invalid);
test(instructions[13], DataSize::Word, Operation::XCHG, Source::eAX, Source::eBX);
// inc %bx
// cmp $0x8e,%al
// [[ omitted: push $0x65 ]]
// sbb 0x45(%bx,%si),%bh
// adc %bh,0x3c(%bx)
test(instructions[14], DataSize::Word, Operation::INC, Source::eBX, Source::eBX);
test(instructions[15], DataSize::Byte, Operation::CMP, Source::Immediate, Source::eAX, 0x8e);
test(instructions[16], DataSize::Byte, Operation::SBB, ScaleIndexBase(Source::eBX, Source::eSI), Source::BH, std::nullopt, 0x45);
test(instructions[17], DataSize::Byte, Operation::ADC, Source::BH, ScaleIndexBase(Source::eBX), std::nullopt, 0x3c);
// sbb %bx,0x16(%bp,%si)
// xor %sp,0x2c(%si)
// out %ax,$0xc6
// jge 0xffffffe0
test(instructions[18], DataSize::Word, Operation::SBB, Source::eBX, ScaleIndexBase(Source::eBP, Source::eSI), std::nullopt, 0x16);
test(instructions[19], DataSize::Word, Operation::XOR, Source::eSP, ScaleIndexBase(Source::eSI), std::nullopt, 0x2c);
test(instructions[20], DataSize::Word, Operation::OUT, Source::eAX, Source::DirectAddress, 0xc6);
test(instructions[21], Operation::JNL, std::nullopt, 0xffb0);
// mov $0x49,%ch
// [[ omitted: addr32 popa ]]
// mov $0xcbc0,%dx
// adc $0x7e,%al
// jno 0x0000000b
test(instructions[22], DataSize::Byte, Operation::MOV, Source::Immediate, Source::CH, 0x49);
test(instructions[23], DataSize::Word, Operation::MOV, Source::Immediate, Source::eDX, 0xcbc0);
test(instructions[24], DataSize::Byte, Operation::ADC, Source::Immediate, Source::eAX, 0x7e);
test(instructions[25], Operation::JNO, std::nullopt, 0xffd0);
// push %ax
// js 0x0000007b
// add (%di),%bx
// in $0xc9,%ax
test(instructions[26], DataSize::Word, Operation::PUSH, Source::eAX);
test(instructions[27], Operation::JS, std::nullopt, 0x3d);
test(instructions[28], DataSize::Word, Operation::ADD, ScaleIndexBase(Source::eDI), Source::eBX);
test(instructions[29], DataSize::Word, Operation::IN, Source::DirectAddress, Source::eAX, 0xc9);
// xchg %ax,%di
// ret
// fwait
// out %al,$0xd3
test(instructions[30], DataSize::Word, Operation::XCHG, Source::eAX, Source::eDI);
test(instructions[31], Operation::RETnear);
test(instructions[32], Operation::WAIT);
test(instructions[33], DataSize::Byte, Operation::OUT, Source::eAX, Source::DirectAddress, 0xd3);
// [[ omitted: insb (%dx),%es:(%di) ]]
// pop %ax
// dec %bp
// jbe 0xffffffcc
// inc %sp
test(instructions[34], DataSize::Word, Operation::POP, Source::eAX, Source::eAX);
test(instructions[35], DataSize::Word, Operation::DEC, Source::eBP, Source::eBP);
test(instructions[36], Operation::JBE, std::nullopt, 0xff80);
test(instructions[37], DataSize::Word, Operation::INC, Source::eSP, Source::eSP);
// (bad)
// lahf
// movsw %ds:(%si),%es:(%di)
// mov $0x12a1,%bp
test(instructions[38], Operation::Invalid);
test(instructions[39], Operation::LAHF);
test(instructions[40], DataSize::Word, Operation::MOVS); // Arguments are implicit.
test(instructions[41], DataSize::Word, Operation::MOV, Source::Immediate, Source::eBP, 0x12a1);
// lds (%bx,%di),%bp
// [[ omitted: leave ]]
// sahf
// fdiv %st(3),%st
// iret
test(instructions[42], DataSize::Word, Operation::LDS);
test(instructions[43], Operation::SAHF);
test(instructions[44], Operation::ESC);
test(instructions[45], Operation::IRET);
// xchg %ax,%dx
// cmp %bx,-0x70(%di)
// adc $0xb8c3,%ax
// lods %ds:(%si),%ax
test(instructions[46], DataSize::Word, Operation::XCHG, Source::eAX, Source::eDX);
test(instructions[47], DataSize::Word, Operation::CMP, Source::eBX, ScaleIndexBase(Source::eDI), std::nullopt, 0xff90);
test(instructions[48], DataSize::Word, Operation::ADC, Source::Immediate, Source::eAX, 0xb8c3);
test(instructions[49], DataSize::Word, Operation::LODS);
// call 0x0000172d
// dec %dx
// mov $0x9e,%al
// stc
test(instructions[50], Operation::CALLrel, 0, 0x16c8);
test(instructions[51], DataSize::Word, Operation::DEC, Source::eDX, Source::eDX);
test(instructions[52], DataSize::Byte, Operation::MOV, Source::Immediate, Source::eAX, 0x9e);
test(instructions[53], Operation::STC);
// mov $0xea56,%di
// dec %si
// std
// in $0x5a,%al
test(instructions[54], DataSize::Word, Operation::MOV, Source::Immediate, Source::eDI, 0xea56);
test(instructions[55], DataSize::Word, Operation::DEC, Source::eSI, Source::eSI);
test(instructions[56], Operation::STD);
test(instructions[57], DataSize::Byte, Operation::IN, Source::DirectAddress, Source::eAX, 0x5a);
// and 0x5b2c(%bp,%si),%bp
// sub %dl,%dl
// negw 0x18(%bx)
// xchg %dl,0x6425(%bx,%si)
test(instructions[58], DataSize::Word, Operation::AND, ScaleIndexBase(Source::eBP, Source::eSI), Source::eBP, std::nullopt, 0x5b2c);
test(instructions[59], DataSize::Byte, Operation::SUB, Source::eDX, Source::eDX);
test(instructions[60], DataSize::Word, Operation::NEG, ScaleIndexBase(Source::eBX), ScaleIndexBase(Source::eBX), std::nullopt, 0x18);
test(instructions[61], DataSize::Byte, Operation::XCHG, ScaleIndexBase(Source::eBX, Source::eSI), Source::eDX, std::nullopt, 0x6425);
// mov $0xc3,%bh
test(instructions[62], DataSize::Byte, Operation::MOV, Source::Immediate, Source::BH, 0xc3);
}
- (void)test83 {
const auto instructions = decode<Model::i8086>({
0x83, 0x10, 0x80, // adcw $0xff80,(%bx,%si)
0x83, 0x3b, 0x04, // cmpw $0x4,(%bp,%di)
0x83, 0x2f, 0x09, // subw $0x9,(%bx)
});
XCTAssertEqual(instructions.size(), 3);
test(instructions[0], DataSize::Word, Operation::ADC, Source::Immediate, ScaleIndexBase(Source::eBX, Source::eSI), 0xff80);
test(instructions[1], DataSize::Word, Operation::CMP, Source::Immediate, ScaleIndexBase(Source::eBP, Source::eDI), 0x4);
test(instructions[2], DataSize::Word, Operation::SUB, Source::Immediate, ScaleIndexBase(Source::eBX), 0x9);
}
- (void)testFar {
const auto instructions = decode<Model::i8086>({
0x9a, 0x12, 0x34, 0x56, 0x78, // lcall 0x7856, 0x3412
});
XCTAssertEqual(instructions.size(), 1);
test_far(instructions[0], Operation::CALLfar, 0x7856, 0x3412);
}
- (void)testLDSLESEtc {
auto run_test = [](bool is_32, DataSize size) {
const auto instructions = decode<Model::i80386>({
0xc5, 0x33, // 16-bit: lds si, (bp, di); 32-bit: lds esi, (ebx)
0xc4, 0x17, // 16-bit: les dx, (bx); 32-bit: les edx, (edi)
0x0f, 0xb2, 0x17, // 16-bit: lss dx, (bx); 32-bit: lss edx, (edi)
}, is_32);
XCTAssertEqual(instructions.size(), 3);
if(is_32) {
test(instructions[0], size, Operation::LDS, ScaleIndexBase(Source::eBX), Source::eSI);
test(instructions[1], size, Operation::LES, ScaleIndexBase(Source::eDI), Source::eDX);
test(instructions[2], size, Operation::LSS, ScaleIndexBase(Source::eDI), Source::eDX);
} else {
test(instructions[0], size, Operation::LDS, ScaleIndexBase(Source::eBP, Source::eDI), Source::eSI);
test(instructions[1], size, Operation::LES, ScaleIndexBase(Source::eBX), Source::eDX);
test(instructions[2], size, Operation::LSS, ScaleIndexBase(Source::eBX), Source::eDX);
}
};
run_test(false, DataSize::Word);
run_test(true, DataSize::DWord);
}
- (void)testSIB {
const auto instructions = decode<Model::i80386>({
// add edx, -0x7d(ebp + eax*2)
0x01, 0x54, 0x45, 0x83,
// add edx, -0x80(si)
0x67, 0x01, 0x54, 0x80,
}, true);
XCTAssertEqual(instructions.size(), 2);
test(instructions[0], DataSize::DWord, Operation::ADD, Source::eDX, ScaleIndexBase(1, Source::eAX, Source::eBP), 0x00, -125);
test(instructions[1], DataSize::DWord, Operation::ADD, Source::eDX, ScaleIndexBase(Source::eSI), 0x00, -128);
XCTAssertEqual(instructions[1].address_size(), AddressSize::b16);
}
- (void)testJMP {
const auto instructions = decode<Model::i80386>({
// JMP +0x00efcdab
0xe9, 0xab, 0xcd, 0xef, 0x00,
// JMP 0xc389:0x67452301
0xea, 0x01, 0x23, 0x45, 0x67, 0x89, 0xc3,
// JMP -79
0xeb, 0xb1,
// JMP DWORD (edx)
0xff, 0x22,
// JMP FWORD (eax)
0xff, 0x28,
}, true);
XCTAssertEqual(instructions.size(), 5);
test(instructions[0], Operation::JMPrel, 0, 0xefcdab);
test_far(instructions[1], Operation::JMPfar, 0xc389, 0x67452301);
test(instructions[2], Operation::JMPrel, 0, -79);
test(instructions[3], DataSize::DWord, Operation::JMPabs, ScaleIndexBase(Source::eDX));
test(instructions[4], DataSize::DWord, Operation::JMPfar, ScaleIndexBase(Source::eAX));
}
- (void)test32bitSequence {
const auto instructions = decode<Model::i80386>({
0x2e, 0x42, 0x0c, 0x09, 0x81, 0x47, 0xbe, 0xa9, 0x3a, 0x68, 0x9f, 0xf0, 0x7a, 0xe2, 0x3e, 0xb4,
0xc1, 0x1f, 0xaa, 0x60, 0xb4, 0xe1, 0x91, 0xdc, 0xf6, 0x62, 0x90, 0x90, 0xdf, 0xcd, 0xf9, 0x0f,
0xbb, 0x71, 0x4b, 0x58, 0x55, 0x38, 0x2c, 0xf9, 0x50, 0xfe, 0xce, 0xe0, 0xc1, 0xda, 0x83, 0x8c,
0x19, 0x0c, 0x9b, 0x89, 0x13, 0x34, 0x45, 0xc5, 0x11, 0xa2, 0xd3, 0xa6, 0xdb, 0xe4, 0x1f, 0xa5,
0x79, 0xf3, 0x7d, 0x1c, 0xb8, 0xda, 0x6b, 0x76, 0x8a, 0x79, 0x28, 0x52, 0xcd, 0xc4, 0xe9, 0xba,
0x11, 0xcf, 0x29, 0x09, 0x46, 0x1a, 0xc0, 0x5d, 0x88, 0x34, 0xa5, 0x83, 0xe2, 0xd0, 0xf5, 0x44,
0x9d, 0xa5, 0xc1, 0x5e, 0x4f, 0x07, 0x51, 0xd4, 0xed, 0xb0, 0x69, 0xd7, 0x00, 0xc5, 0x51, 0xfb,
0x68, 0x85, 0x3a, 0x8b, 0x69, 0x28, 0x0c, 0xec, 0xb1, 0xb7, 0x3b, 0x8d, 0x5f, 0x44, 0x87, 0x2c,
0xe3, 0x02, 0x9e, 0x74, 0x6e, 0x1b, 0x8f, 0x4d, 0xc5, 0x33, 0x04, 0x9f, 0xac, 0xc0, 0xc9, 0x60,
0x9a, 0x8a, 0xf5, 0xd0, 0x97, 0x1b, 0xe2, 0x64, 0x60, 0xb0, 0xcf, 0xe3, 0x37,
}, true);
XCTAssertEqual(instructions.size(), 64);
// cs inc edx
// or al,0x9
// add DWORD PTR [edi-0x42],0x9f683aa9
// lock jp 0xfffffff0 (from 0000000e)
test(instructions[0], DataSize::DWord, Operation::INC, Source::eDX);
XCTAssertEqual(instructions[0].data_segment(), Source::CS);
test(instructions[1], DataSize::Byte, Operation::OR, Source::Immediate, Source::eAX, 0x9);
test(instructions[2], DataSize::DWord, Operation::ADD, Source::Immediate, ScaleIndexBase(Source::eDI), 0x9f683aa9, -0x42);
test(instructions[3], Operation::JP, 0, -30);
XCTAssert(instructions[3].lock());
// ds mov ah,0xc1
// pop ds
// stos BYTE PTR es:[edi],al
// pusha
test(instructions[4], DataSize::Byte, Operation::MOV, Source::Immediate, Source::AH, 0xc1);
XCTAssertEqual(instructions[4].data_segment(), Source::DS);
test(instructions[5], DataSize::Word, Operation::POP, Source::None, Source::DS);
test(instructions[6], DataSize::Byte, Operation::STOS);
test(instructions[7], Operation::PUSHA);
// mov ah,0xe1
// xchg ecx,eax
// fdivr st(6),st
// bound edx,QWORD PTR [eax-0x6322070]
test(instructions[8], DataSize::Byte, Operation::MOV, Source::Immediate, Source::AH, 0xe1);
test(instructions[9], DataSize::DWord, Operation::XCHG, Source::eAX, Source::eCX);
test(instructions[10], DataSize::None, Operation::ESC);
test(instructions[11], DataSize::DWord, Operation::BOUND, ScaleIndexBase(Source::eAX), Source::eDX, 0, -0x6322070);
// btc DWORD PTR [ecx+0x4b],esi
// pop eax
// push ebp
// cmp BYTE PTR [ecx+edi*8],ch
test(instructions[12], DataSize::DWord, Operation::BTC, Source::eSI, ScaleIndexBase(Source::eCX), 0, 0x4b);
test(instructions[13], DataSize::DWord, Operation::POP, Source::eAX, Source::eAX);
test(instructions[14], DataSize::DWord, Operation::PUSH, Source::eBP);
test(instructions[15], DataSize::Byte, Operation::CMP, Source::CH, ScaleIndexBase(3, Source::eDI, Source::eCX));
// Possibly TODO: pick a lane on whether PUSH/POP duplicate source and destination.
// It doesn't really matter outside of these tests though.
// push eax
// dec dh
// loopne 0xffffffee (from 0x2d)
// fiadd DWORD PTR [ebx-0x64f3e674]
test(instructions[16], DataSize::DWord, Operation::PUSH, Source::eAX);
test(instructions[17], DataSize::Byte, Operation::DEC, Source::DH);
test(instructions[18], Operation::LOOPNE, 0, -63);
test(instructions[19], Operation::ESC);
// mov DWORD PTR [ebx],edx
// xor al,0x45
// lds edx,FWORD PTR [ecx]
// mov ds:0xe4dba6d3,al
test(instructions[20], DataSize::DWord, Operation::MOV, Source::eDX, ScaleIndexBase(Source::eBX));
test(instructions[21], DataSize::Byte, Operation::XOR, Source::Immediate, Source::eAX, 0x45);
test(instructions[22], DataSize::DWord, Operation::LDS, ScaleIndexBase(Source::eCX), Source::eDX);
test(instructions[23], DataSize::Byte, Operation::MOV, Source::eAX, Source::DirectAddress, 0xe4dba6d3);
XCTAssertEqual(instructions[23].data_segment(), Source::DS);
// pop ds
// movs DWORD PTR es:[edi],DWORD PTR ds:[esi]
// jns 0x00000035 (from 0x42)
// jge 0x00000060 (from 0x44)
test(instructions[24], DataSize::Word, Operation::POP, Source::None, Source::DS);
test(instructions[25], DataSize::DWord, Operation::MOVS);
test(instructions[26], Operation::JNS, 0, -0xd);
test(instructions[27], Operation::JNL, 0, 0x1c);
// mov eax,0x8a766bda
// jns 0x00000073 (from 0x4b)
// push edx
// int 0xc4
test(instructions[28], DataSize::DWord, Operation::MOV, Source::Immediate, Source::eAX, 0x8a766bda);
test(instructions[29], Operation::JNS, 0, 0x28);
test(instructions[30], DataSize::DWord, Operation::PUSH, Source::eDX);
test(instructions[31], Operation::INT, 0xc4);
// jmp 0x29cf120d (from 0x53)
// or DWORD PTR [esi+0x1a],eax
// rcr BYTE PTR [ebp-0x78],0x34
// movs DWORD PTR es:[edi],DWORD PTR ds:[esi]
test(instructions[32], Operation::JMPrel, 0, 0x29cf120d - 0x53);
test(instructions[33], DataSize::DWord, Operation::OR, Source::eAX, ScaleIndexBase(Source::eSI), 0, 0x1a);
test(instructions[34], DataSize::Byte, Operation::RCR, Source::Immediate, ScaleIndexBase(Source::eBP), 0x34, -0x78);
test(instructions[35], DataSize::DWord, Operation::MOVS);
// and edx,0xffffffd0
// cmc
// inc esp
// popf
test(instructions[36], DataSize::DWord, Operation::AND, Source::Immediate, Source::eDX);
test(instructions[37], DataSize::None, Operation::CMC);
test(instructions[38], DataSize::DWord, Operation::INC, Source::eSP);
test(instructions[39], DataSize::DWord, Operation::POPF);
// movs DWORD PTR es:[edi],DWORD PTR ds:[esi]
// rcr DWORD PTR [esi+0x4f],0x7
// push ecx
// aam 0xed
test(instructions[40], DataSize::DWord, Operation::MOVS);
test(instructions[41], DataSize::DWord, Operation::RCR, Source::Immediate, ScaleIndexBase(Source::eSI), 0x07, 0x4f);
test(instructions[42], DataSize::DWord, Operation::PUSH, Source::eCX);
test(instructions[43], Operation::AAM, 0xed);
// mov al,0x69
// xlat BYTE PTR ds:[ebx]
// add ch,al
// push ecx
test(instructions[44], DataSize::Byte, Operation::MOV, Source::Immediate, Source::eAX, 0x69);
test(instructions[45], Operation::XLAT);
test(instructions[46], DataSize::Byte, Operation::ADD, Source::eAX, Source::CH);
test(instructions[47], DataSize::DWord, Operation::PUSH, Source::eCX);
// sti
// push 0x698b3a85
// sub BYTE PTR [esp+ebp*8],cl
// mov cl,0xb7
test(instructions[48], Operation::STI);
test(instructions[49], DataSize::DWord, Operation::PUSH, Source::Immediate, Source::None, 0x698b3a85);
test(instructions[50], DataSize::Byte, Operation::SUB, Source::eCX, ScaleIndexBase(3, Source::eBP, Source::eSP));
test(instructions[51], DataSize::Byte, Operation::MOV, Source::Immediate, Source::eCX, 0xb7);
// cmp ecx,DWORD PTR [ebp+0x2c87445f]
// jecxz 0x00000084 (from 0x82)
// sahf
// jz 0x000000f3 (from 0x85)
test(instructions[52], DataSize::DWord, Operation::CMP, ScaleIndexBase(Source::eBP), Source::eCX, 0, 0x2c87445f);
test(instructions[53], Operation::JCXZ, 0, 0x02);
test(instructions[54], Operation::SAHF);
test(instructions[55], Operation::JZ, 0, 0x6e);
// sbb ecx,DWORD PTR [edi+0x433c54d]
// lahf
// lods al,BYTE PTR ds:[esi]
// ror cl,0x60
test(instructions[56], DataSize::DWord, Operation::SBB, ScaleIndexBase(Source::eDI), Source::eCX, 0, 0x433c54d);
test(instructions[57], Operation::LAHF);
test(instructions[58], Operation::LODS);
test(instructions[59], DataSize::Byte, Operation::ROR, Source::Immediate, Source::eCX, 0x60);
// call 0xe21b:0x97d0f58a
// fs pusha
// mov al,0xcf
// jecxz 0x000000d4 (from 0x9d)
test_far(instructions[60], Operation::CALLfar, 0xe21b, 0x97d0f58a);
test(instructions[61], Operation::PUSHA);
test(instructions[62], DataSize::Byte, Operation::MOV, Source::Immediate, Source::eAX, 0xcf);
test(instructions[63], Operation::JCXZ, 0, 0xd4 - 0x9d);
}
- (void)testSourceModRegRM1 {
const auto instructions = decode<Model::i80386>({
0x62, 0x90, 0x90, 0xdf, 0xcd, 0xf9
}, true);
XCTAssertEqual(instructions.size(), 1);
test(instructions[0], DataSize::DWord, Operation::BOUND, ScaleIndexBase(Source::eAX), Source::eDX, 0, -0x6322070);
}
- (void)testSourceModRegRM2 {
const auto instructions = decode<Model::i80386>({
0x81, 0x47, 0xbe, 0xa9, 0x3a, 0x68, 0x9f
}, true);
XCTAssertEqual(instructions.size(), 1);
test(instructions[0], DataSize::DWord, Operation::ADD, Source::Immediate, ScaleIndexBase(Source::eDI), 0x9f683aa9, -0x42);
}
- (void)test8086LengthLimit {
const std::vector<uint8_t> all_prefix(65536, 0x26);
const auto instructions = decode<Model::i8086>(all_prefix);
XCTAssertEqual(instructions.size(), 1);
test(instructions[0], Operation::NOP);
}
- (void)test286LengthLimit {
const auto instructions = decode<Model::i80286>({
0x90,
0x26, 0x90,
0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
});
XCTAssertEqual(instructions.size(), 12);
test(instructions[0], Operation::NOP);
test(instructions[1], Operation::NOP);
test(instructions[2], Operation::NOP);
test(instructions[3], Operation::NOP);
test(instructions[4], Operation::NOP);
test(instructions[5], Operation::NOP);
test(instructions[6], Operation::NOP);
test(instructions[7], Operation::NOP);
test(instructions[8], Operation::NOP);
test(instructions[9], Operation::NOP);
test(instructions[10], Operation::Invalid);
test(instructions[11], Operation::NOP);
}
- (void)test386LengthLimit {
const auto instructions = decode<Model::i80386>({
0x90,
0x26, 0x90,
0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x26, 0x90,
});
XCTAssertEqual(instructions.size(), 17);
test(instructions[0], Operation::NOP);
test(instructions[1], Operation::NOP);
test(instructions[2], Operation::NOP);
test(instructions[3], Operation::NOP);
test(instructions[4], Operation::NOP);
test(instructions[5], Operation::NOP);
test(instructions[6], Operation::NOP);
test(instructions[7], Operation::NOP);
test(instructions[8], Operation::NOP);
test(instructions[9], Operation::NOP);
test(instructions[10], Operation::NOP);
test(instructions[11], Operation::NOP);
test(instructions[12], Operation::NOP);
test(instructions[13], Operation::NOP);
test(instructions[14], Operation::NOP);
test(instructions[15], Operation::Invalid);
test(instructions[16], Operation::NOP);
}
- (void)testAddressSizeModifier {
const auto instructions = decode<Model::i80386>({
0x67, 0xf3, 0x5d, 0x67, 0x3f, 0x67, 0x5a, 0x67, 0xea, 0x17, 0xa2, 0x38, 0x0b, 0xeb, 0xbc, 0x67,
0x4c, 0x67, 0x3a, 0x1f, 0x67, 0x00, 0x8d, 0xf9, 0x43, 0x67, 0xb1, 0x7c, 0x67, 0x88, 0xd1, 0x67,
0x31, 0xed, 0x67, 0x22, 0x00, 0x67, 0x79, 0xa7, 0x67, 0x87, 0x3c, 0x67, 0xd4, 0xa2, 0x67, 0x57,
0x67, 0x02, 0x21, 0x67, 0x48, 0x67, 0x33, 0x5d, 0xd7, 0x67, 0x3c, 0xe1, 0x67, 0x91, 0x67, 0x1b,
0x84, 0x43, 0x7f, 0x67, 0x15, 0xf6, 0x06, 0x2b, 0x6d
}, true);
// Lazy: just check that the right number of operations came out.
// Since the potential issue is reading the wrong size of address, that'll do.
XCTAssertEqual(instructions.size(), 22);
}
- (void)testAddressSizeModifierSIB {
const auto instructions = decode<Model::i80386>({
// add dword ptr [bx + si + 256], eax
0x67, 0x01, 0x80, 0x00, 0x01,
// add [eax + 256], eax
0x01, 0x80, 0x00, 0x01, 0x00, 0x00
}, true);
XCTAssertEqual(instructions.size(), 2);
test(instructions[0], DataSize::DWord, Operation::ADD, Source::eAX, ScaleIndexBase(Source::eBX, Source::eSI), 0, 0x100);
test(instructions[1], DataSize::DWord, Operation::ADD, Source::eAX, ScaleIndexBase(Source::eAX), 0, 0x100);
}
@end