1
0
mirror of https://github.com/lefticus/6502-cpp.git synced 2024-12-21 10:30:35 +00:00

Initial commit

This commit is contained in:
Jason Turner 2016-07-06 18:35:40 -06:00
commit efcb6fa7ac
3 changed files with 610 additions and 0 deletions

517
src/main.cpp Normal file
View File

@ -0,0 +1,517 @@
#include <iostream>
#include <vector>
#include <set>
#include <string>
#include <regex>
#include <cassert>
#include <map>
#include <cctype>
struct ASMLine
{
enum class Type
{
Label,
Instruction,
Directive
};
ASMLine(Type t, std::string te) : type(t), text(std::move(te)) {}
Type type;
std::string text;
};
struct Operand
{
enum class Type
{
empty,
literal,
reg /*ister*/
};
int reg_num = 0;
Type type = Type::empty;
std::string value;
Operand() = default;
Operand(const Type t, const std::string v)
: type(t), value(std::move(v))
{
assert(type == Type::literal);
}
Operand(const Type t, const int num)
: type(t), reg_num(num)
{
assert(type == Type::reg);
}
};
struct mos6502 : ASMLine
{
enum class OpCode
{
unknown,
lda,
sta,
pha,
pla,
AND,
cmp,
bne,
beq,
jmp,
adc,
sbc
};
static bool get_is_branch(const OpCode o) {
switch (o) {
case OpCode::beq:
case OpCode::bne:
return true;
case OpCode::lda:
case OpCode::sta:
case OpCode::pha:
case OpCode::pla:
case OpCode::AND:
case OpCode::cmp:
case OpCode::jmp:
case OpCode::adc:
case OpCode::sbc:
return false;
}
}
static bool get_is_comparison(const OpCode o) {
switch (o) {
case OpCode::cmp:
return true;
case OpCode::lda:
case OpCode::sta:
case OpCode::pha:
case OpCode::pla:
case OpCode::AND:
case OpCode::jmp:
case OpCode::bne:
case OpCode::beq:
case OpCode::adc:
case OpCode::sbc:
return false;
}
}
mos6502(const OpCode o)
: ASMLine(Type::Instruction, to_string(o)), opcode(o), is_branch(get_is_branch(o)), is_comparison(get_is_comparison(o))
{
}
mos6502(const Type t, const std::string s)
: ASMLine(t, std::move(s))
{
}
mos6502(const OpCode o, const Operand t_o)
: ASMLine(Type::Instruction, to_string(o)), opcode(o), op(std::move(t_o)), is_branch(get_is_branch(o)), is_comparison(get_is_comparison(o))
{
}
static std::string to_string(const OpCode o)
{
switch (o) {
case OpCode::lda:
return "\tlda";
case OpCode::sta:
return "\tsta";
case OpCode::pha:
return "\tpha";
case OpCode::pla:
return "\tpla";
case OpCode::AND:
return "\tand";
case OpCode::cmp:
return "\tcmp";
case OpCode::bne:
return "\tbne";
case OpCode::beq:
return "\tbeq";
case OpCode::jmp:
return "\tjmp";
case OpCode::adc:
return "\tadc";
case OpCode::sbc:
return "\tsbc";
case OpCode::unknown:
return "";
};
}
std::string to_string() const
{
switch (type) {
case ASMLine::Type::Label:
return text + ':';
case ASMLine::Type::Directive:
case ASMLine::Type::Instruction:
return '\t' + text + ' ' + op.value;
};
}
OpCode opcode = OpCode::unknown;
Operand op;
bool is_branch = false;
bool is_comparison = false;
};
struct i386 : ASMLine
{
enum class OpCode
{
unknown,
movzbl,
movzwl,
shrb,
xorl,
andl,
ret,
movb,
jmp,
jne,
je,
testb,
addl,
subl
};
static OpCode parse_opcode(Type t, const std::string &o)
{
switch(t)
{
case Type::Label:
return OpCode::unknown;
case Type::Directive:
return OpCode::unknown;
case Type::Instruction:
{
if (o == "movzwl") return OpCode::movzwl;
if (o == "movzbl") return OpCode::movzbl;
if (o == "shrb") return OpCode::shrb;
if (o == "xorl") return OpCode::xorl;
if (o == "andl") return OpCode::andl;
if (o == "ret") return OpCode::ret;
if (o == "movb") return OpCode::movb;
if (o == "jmp") return OpCode::jmp;
if (o == "testb") return OpCode::testb;
if (o == "jne") return OpCode::jne;
if (o == "je") return OpCode::je;
if (o == "subl") return OpCode::subl;
if (o == "addl") return OpCode::addl;
throw std::runtime_error("Unknown opcode: " + o);
}
}
}
static Operand parse_operand(std::string o)
{
if (o.empty()) {
throw std::runtime_error("Empty operand?!");
}
if (o[0] == '%') {
if (o == "%eax") {
return Operand(Operand::Type::reg, 1);
} else if (o == "%al") {
return Operand(Operand::Type::reg, 1);
} else if (o == "%di") {
return Operand(Operand::Type::reg, 6);
} else {
throw std::runtime_error("Unknown register operand: '" + o + "'");
}
} else {
return Operand(Operand::Type::literal, o);
}
}
i386(Type t, std::string o1)
: ASMLine(t, o1), opcode(parse_opcode(t, o1))
{
}
i386(Type t, std::string opcode, std::string o1)
: ASMLine(t, opcode), opcode(parse_opcode(t, opcode)), operand1(parse_operand(std::move(o1)))
{
}
i386(Type t, std::string opcode, std::string o1, std::string o2)
: ASMLine(t, opcode), opcode(parse_opcode(t, opcode)), operand1(parse_operand(std::move(o1))), operand2(parse_operand(std::move(o2)))
{
}
OpCode opcode;
Operand operand1;
Operand operand2;
};
void translate_instruction(std::vector<mos6502> &instructions, const i386::OpCode op, const Operand &o1, const Operand &o2)
{
switch(op)
{
case i386::OpCode::movb:
if (o1.type == Operand::Type::literal && o1.type == Operand::Type::literal) {
instructions.emplace_back(mos6502::OpCode::pha); // transfer memory through A register, pushing and popping around it
instructions.emplace_back(mos6502::OpCode::lda, Operand(o1.type, "#" + o1.value));
instructions.emplace_back(mos6502::OpCode::sta, o2);
instructions.emplace_back(mos6502::OpCode::pla);
} else if (o1.type == Operand::Type::reg && o1.reg_num == 1 && o2.type == Operand::Type::literal) {
instructions.emplace_back(mos6502::OpCode::sta, o2);
} else {
throw std::runtime_error("Cannot translate instruction");
}
break;
case i386::OpCode::movzbl:
if (o1.type == Operand::Type::literal && o2.type == Operand::Type::reg && o2.reg_num == 1) {
instructions.emplace_back(mos6502::OpCode::lda, o1);
} else {
throw std::runtime_error("Cannot translate instruction");
}
break;
case i386::OpCode::testb:
if (o1.type == Operand::Type::literal && o2.type == Operand::Type::reg && o2.reg_num == 1) {
instructions.emplace_back(mos6502::OpCode::AND, Operand(o1.type, "#" + o1.value));
instructions.emplace_back(mos6502::OpCode::cmp, Operand(Operand::Type::literal, "#$0"));
} else {
throw std::runtime_error("Cannot translate instruction");
}
break;
case i386::OpCode::jne:
instructions.emplace_back(mos6502::OpCode::bne, o1);
break;
case i386::OpCode::je:
instructions.emplace_back(mos6502::OpCode::beq, o1);
break;
case i386::OpCode::jmp:
instructions.emplace_back(mos6502::OpCode::jmp, o1);
break;
case i386::OpCode::addl:
if (o1.type == Operand::Type::literal && o2.type == Operand::Type::reg && o2.reg_num == 1) {
instructions.emplace_back(mos6502::OpCode::adc, Operand(o1.type, "#" + o1.value));
} else {
throw std::runtime_error("Cannot translate instruction");
}
break;
case i386::OpCode::subl:
if (o1.type == Operand::Type::literal && o2.type == Operand::Type::reg && o2.reg_num == 1) {
instructions.emplace_back(mos6502::OpCode::sbc, Operand(o1.type, "#" + o1.value));
} else {
throw std::runtime_error("Cannot translate instruction");
}
break;
default:
throw std::runtime_error("Cannot translate instruction");
};
}
void to_mos6502(const i386 &i, std::vector<mos6502> &instructions)
{
switch(i.type)
{
case ASMLine::Type::Label:
instructions.emplace_back(i.type, i.text);
return;
case ASMLine::Type::Directive:
throw std::runtime_error("Directives not understood during translation");
case ASMLine::Type::Instruction:
translate_instruction(instructions, i.opcode, i.operand1, i.operand2);
return;
}
}
bool fix_overwritten_flags(std::vector<mos6502> &instructions)
{
if (instructions.size() < 3) {
return false;
}
for (size_t op = 0; op < instructions.size() - 2; ++op)
{
if (instructions[op].is_comparison
&& !instructions[op + 1].is_comparison
&& !instructions[op + 1].is_branch
&& instructions[op + 2].is_branch) {
const auto opcode_to_duplicate = op + 1;
const auto new_pos_1 = op + 3;
const auto new_pos_2 = [&instructions, branch = instructions[op + 2].op.value](){
for (size_t cur_op = 0; cur_op < instructions.size(); ++cur_op) {
if (instructions[cur_op].type == ASMLine::Type::Label
&& instructions[cur_op].text == branch) {
return cur_op + 1;
}
}
throw std::runtime_error("Unable to find matching branch!");
}();
instructions.insert(std::next(std::begin(instructions), std::max(new_pos_1, new_pos_2)), instructions[opcode_to_duplicate]);
instructions.insert(std::next(std::begin(instructions), std::min(new_pos_1, new_pos_2)), instructions[opcode_to_duplicate]);
instructions.erase(std::next(std::begin(instructions), opcode_to_duplicate));
return true;
}
}
return false;
}
int main()
{
std::regex Label(R"(^(\S+):)");
std::regex Directive(R"(^\t(\..+))");
std::regex UnaryInstruction(R"(^\t(\S+)\s+(\S+))");
std::regex BinaryInstruction(R"(^\t(\S+)\s+(\S+),\s+(\S+))");
std::regex Instruction(R"(^\t(\S+))");
int lineno = 0;
std::vector<i386> instructions;
while (std::cin.good())
{
std::string line;
getline(std::cin, line);
std::smatch match;
if (std::regex_match(line, match, Label))
{
instructions.emplace_back(ASMLine::Type::Label, match[1]);
} else if (std::regex_match(line, match, Directive)) {
instructions.emplace_back(ASMLine::Type::Directive, match[1]);
} else if (std::regex_match(line, match, UnaryInstruction)) {
instructions.emplace_back(ASMLine::Type::Instruction, match[1], match[2]);
} else if (std::regex_match(line, match, BinaryInstruction)) {
instructions.emplace_back(ASMLine::Type::Instruction, match[1], match[2], match[3]);
} else if (std::regex_match(line, match, Instruction)) {
instructions.emplace_back(ASMLine::Type::Instruction, match[1]);
} else if (line == "") {
//std::cout << "EmptyLine\n";
} else {
throw std::runtime_error("Unparsed Input, Line: " + std::to_string(lineno));
}
++lineno;
}
std::set<std::string> labels;
for (const auto i : instructions)
{
if (i.type == ASMLine::Type::Label) {
labels.insert(i.text);
}
}
std::set<std::string> used_labels{"main"};
for (const auto i : instructions)
{
if (i.type == ASMLine::Type::Instruction)
{
if (labels.count(i.operand1.value) != 0) {
used_labels.insert(i.operand1.value);
}
if (labels.count(i.operand2.value) != 0) {
used_labels.insert(i.operand2.value);
}
}
}
// remove all labels and directives that we don't need
instructions.erase(
std::remove_if(std::begin(instructions), std::end(instructions),
[&used_labels](const auto &i){
if (i.type == ASMLine::Type::Directive) return true;
if (i.type == ASMLine::Type::Label) {
if (used_labels.count(i.text) == 0) {
// remove all unused labels that aren't 'main'
return true;
}
}
return false;
}
),
std::end(instructions)
);
// remove everything up to the first label
// this will probably leave some dead code around at some point
// but it's a start
instructions.erase(
std::begin(instructions),
std::find_if(std::begin(instructions),
std::end(instructions),
[](const auto &i){ return i.type == ASMLine::Type::Label; }
)
);
const auto new_labels =
[&used_labels](){
std::map<std::string, std::string> result;
for (const auto &l : used_labels) {
auto newl = l;
std::transform(newl.begin(), newl.end(), newl.begin(), [](const auto c) { return std::tolower(c); });
newl.erase(std::remove_if(newl.begin(), newl.end(), [](const auto c){ return !std::isalnum(c); }), std::end(newl));
std::cout << "Old label: '" << l << "' new label: '" << newl << "'\n";
result.emplace(std::make_pair(l, newl));
}
return result;
}();
for (auto &i : instructions)
{
if (i.type == ASMLine::Type::Label)
{
std::cout << "Updating label " << i.text << '\n';;
i.text = new_labels.at(i.text);
}
const auto itr1 = new_labels.find(i.operand1.value);
if (itr1 != new_labels.end()) {
i.operand1.value = itr1->second;
}
const auto itr2 = new_labels.find(i.operand2.value);
if (itr2 != new_labels.end()) {
i.operand1.value = itr2->second;
}
}
std::vector<mos6502> new_instructions;
for (const auto &i : instructions)
{
to_mos6502(i, new_instructions);
}
while (fix_overwritten_flags(new_instructions))
{
// do it however many times it takes
}
for (const auto i : new_instructions)
{
std::cout << i.to_string() << '\n';
}
}

44
test/test.cpp Normal file
View File

@ -0,0 +1,44 @@
#include <cstdint>
enum class Colors : uint8_t
{
WHITE=0x01
};
volatile uint8_t &memory_loc(const uint16_t loc)
{
return *reinterpret_cast<volatile uint8_t *>(loc);
}
void decrement_border_color()
{
--memory_loc(0xd020);
}
void increment_border_color()
{
++memory_loc(0xd020);
}
bool joystick_down()
{
uint8_t joystick_state = memory_loc(0xDC00);
return (joystick_state & 0x2) == 0;
}
int main()
{
const auto background_color = [](Colors col) {
memory_loc(0xd021) = static_cast<uint8_t>(col);
};
background_color(Colors::WHITE);
while(true) {
if (joystick_down()) {
increment_border_color();
} else {
decrement_border_color();
}
}
}

49
test/test2.cpp Normal file
View File

@ -0,0 +1,49 @@
#include <cstdint>
enum class Colors : uint8_t
{
WHITE=0x01,
BLACK=0x00
};
volatile uint8_t &memory_loc(const uint16_t loc)
{
return *reinterpret_cast<volatile uint8_t *>(loc);
}
void decrement_border_color()
{
--memory_loc(0xd020);
}
void increment_border_color()
{
++memory_loc(0xd020);
}
bool joystick_down()
{
uint8_t joystick_state = memory_loc(0xDC00);
return (joystick_state & 0x2) == 0;
}
int main()
{
const auto background_color = [](Colors col) {
memory_loc(0xd021) = static_cast<uint8_t>(col);
};
const auto border_color = [](Colors col) {
memory_loc(0xd020) = static_cast<uint8_t>(col);
};
background_color(Colors::WHITE);
while(true) {
if (joystick_down()) {
border_color(Colors::WHITE);
} else {
border_color(Colors::BLACK);
}
}
}