2017-12-28 03:21:11 +00:00
|
|
|
/*
|
|
|
|
* mos6502.dis.c
|
|
|
|
*
|
|
|
|
* Disassembly of the mos6502 machine code into an assembly notation.
|
|
|
|
*/
|
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
#include <stdbool.h>
|
|
|
|
|
2017-12-28 03:21:11 +00:00
|
|
|
#include "mos6502.h"
|
2017-12-29 23:08:25 +00:00
|
|
|
#include "mos6502.dis.h"
|
2017-12-28 03:21:11 +00:00
|
|
|
#include "mos6502.enums.h"
|
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
/*
 * One flag per address. The disassembler sets an entry to 1 when it
 * records a jump label for that address, resets it to 0 when the label
 * is removed, and treats any nonzero entry as "this address has a
 * label" when printing.
 */
static vm_8bit jump_table[MOS6502_MEMSIZE];
|
|
|
|
|
2017-12-28 03:21:11 +00:00
|
|
|
/*
 * Printable mnemonics, indexed by instruction code. The strings are
 * literals and the table is never modified, so both the pointers and
 * the characters they point to are const.
 *
 * NOTE(review): the order here is presumably the same as the order of
 * the instruction enum in mos6502.enums.h -- confirm before reordering
 * or inserting entries.
 */
static const char *const instruction_strings[] = {
    "ADC", "AND", "ASL", "BCC",
    "BCS", "BEQ", "BIT", "BMI",
    "BNE", "BPL", "BRK", "BVC",
    "BVS", "CLC", "CLD", "CLI",
    "CLV", "CMP", "CPX", "CPY",
    "DEC", "DEX", "DEY", "EOR",
    "INC", "INX", "INY", "JMP",
    "JSR", "LDA", "LDX", "LDY",
    "LSR", "NOP", "ORA", "PHA",
    "PHP", "PLA", "PLP", "ROL",
    "ROR", "RTI", "RTS", "SBC",
    "SEC", "SED", "SEI", "STA",
    "STX", "STY", "TAX", "TAY",
    "TSX", "TXA", "TXS", "TYA",
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Given a stream, address mode and 16-bit value, print the value out in
|
|
|
|
* the form that is expected given the address mode. The value is not
|
|
|
|
* necessarily going to truly be 16-bit; most address modes use one
|
|
|
|
* 8-bit operand. But we can contain all possible values with the 16-bit
|
|
|
|
* type.
|
|
|
|
*/
|
|
|
|
void
|
2017-12-31 05:02:30 +00:00
|
|
|
mos6502_dis_operand(mos6502 *cpu,
|
|
|
|
FILE *stream,
|
2017-12-31 04:50:23 +00:00
|
|
|
int address,
|
|
|
|
int addr_mode,
|
|
|
|
vm_16bit value)
|
2017-12-28 03:21:11 +00:00
|
|
|
{
|
2017-12-29 23:08:25 +00:00
|
|
|
int rel_address;
|
2017-12-31 04:50:23 +00:00
|
|
|
int ind_address;
|
2017-12-29 23:08:25 +00:00
|
|
|
|
2017-12-28 03:21:11 +00:00
|
|
|
switch (addr_mode) {
|
|
|
|
case ACC:
|
|
|
|
break;
|
|
|
|
case ABS:
|
|
|
|
fprintf(stream, "$%04X", value);
|
|
|
|
break;
|
|
|
|
case ABX:
|
|
|
|
fprintf(stream, "$%04X,X", value);
|
|
|
|
break;
|
|
|
|
case ABY:
|
|
|
|
fprintf(stream, "$%04X,Y", value);
|
|
|
|
break;
|
|
|
|
case IMM:
|
|
|
|
fprintf(stream, "#$%02X", value);
|
|
|
|
break;
|
|
|
|
case IMP:
|
|
|
|
break;
|
|
|
|
case IND:
|
2017-12-31 05:02:30 +00:00
|
|
|
ind_address = vm_segment_get(cpu->memory, value) << 8;
|
|
|
|
ind_address |= vm_segment_get(cpu->memory, value + 1);
|
2017-12-31 04:50:23 +00:00
|
|
|
if (jump_table[ind_address]) {
|
|
|
|
mos6502_dis_label(stream, ind_address);
|
2017-12-29 23:08:25 +00:00
|
|
|
} else {
|
|
|
|
fprintf(stream, "($%04X)", value);
|
|
|
|
}
|
2017-12-28 03:21:11 +00:00
|
|
|
break;
|
|
|
|
case IDX:
|
|
|
|
fprintf(stream, "($%02X,X)", value);
|
|
|
|
break;
|
|
|
|
case IDY:
|
|
|
|
fprintf(stream, "($%02X),Y", value);
|
|
|
|
break;
|
|
|
|
case REL:
|
2017-12-29 23:08:25 +00:00
|
|
|
rel_address = address + value;
|
|
|
|
if (value > 127) {
|
|
|
|
rel_address -= 256;
|
|
|
|
}
|
|
|
|
|
|
|
|
mos6502_dis_label(stream, rel_address);
|
2017-12-28 03:21:11 +00:00
|
|
|
break;
|
|
|
|
case ZPG:
|
|
|
|
fprintf(stream, "$%02X", value);
|
|
|
|
break;
|
|
|
|
case ZPX:
|
|
|
|
fprintf(stream, "$%02X,X", value);
|
|
|
|
break;
|
|
|
|
case ZPY:
|
|
|
|
fprintf(stream, "$%02X,Y", value);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This function will write to the stream the instruction that the given
|
|
|
|
* opcode maps to.
|
|
|
|
*/
|
|
|
|
void
|
2017-12-29 03:47:35 +00:00
|
|
|
mos6502_dis_instruction(FILE *stream, int inst_code)
|
2017-12-28 03:21:11 +00:00
|
|
|
{
|
|
|
|
// Arguably this could or should be done as fputs(), which is
|
|
|
|
// presumably a simpler output method. But, since we use fprintf()
|
|
|
|
// in other places, I think we should continue to do so. Further, we
|
|
|
|
// use a simple format string (%s) to avoid the linter's complaints
|
|
|
|
// about potential security issues.
|
|
|
|
fprintf(stream, "%s", instruction_strings[inst_code]);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This function returns the number of bytes that the given opcode is
|
|
|
|
* expecting to work with. For instance, if the opcode is in absolute
|
|
|
|
* address mode, then we will need to read the next two bytes in the
|
|
|
|
* stream to compose a full 16-bit address to work with. If our opcode
|
|
|
|
* is in immediate mode, then we only need to read one byte. Many
|
|
|
|
* opcodes will read no bytes at all from the stream (in which we return
|
|
|
|
* zero).
|
|
|
|
*/
|
|
|
|
int
|
2017-12-29 05:47:36 +00:00
|
|
|
mos6502_dis_expected_bytes(int addr_mode)
|
2017-12-28 03:21:11 +00:00
|
|
|
{
|
|
|
|
switch (addr_mode) {
|
|
|
|
// These are 16-bit operands, because they work with absolute
|
|
|
|
// addresses in memory.
|
|
|
|
case ABS:
|
|
|
|
case ABY:
|
|
|
|
case ABX:
|
|
|
|
case IND:
|
|
|
|
return 2;
|
|
|
|
|
|
|
|
// These are the 8-bit operand address modes.
|
|
|
|
case IMM:
|
|
|
|
case IDX:
|
|
|
|
case IDY:
|
|
|
|
case REL:
|
|
|
|
case ZPG:
|
|
|
|
case ZPX:
|
|
|
|
case ZPY:
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
// These two address modes have implied arguments; ACC is
|
|
|
|
// the accumulator, and IMP basically means it operates on
|
|
|
|
// some specific (presumably obvious) thing and no operand
|
|
|
|
// is necessary.
|
|
|
|
case ACC:
|
|
|
|
case IMP:
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// I don't know how we got here, outside of foul magicks and cruel
|
|
|
|
// trickery. Let's fearfully return zero!
|
|
|
|
return 0;
|
|
|
|
}
|
2017-12-29 03:47:35 +00:00
|
|
|
|
|
|
|
/*
|
2017-12-31 05:02:30 +00:00
|
|
|
* Scan memory (with a given address) and write the opcode at that
|
2017-12-29 03:47:35 +00:00
|
|
|
* point to the given file stream. This function will also write an
|
|
|
|
* operand to the file stream if one is warranted. We return the number
|
|
|
|
* of bytes consumed by scanning past the opcode and/or operand.
|
|
|
|
*/
|
|
|
|
int
|
2017-12-31 05:02:30 +00:00
|
|
|
mos6502_dis_opcode(mos6502 *cpu, FILE *stream, int address)
|
2017-12-29 03:47:35 +00:00
|
|
|
{
|
|
|
|
vm_8bit opcode;
|
|
|
|
vm_16bit operand;
|
2017-12-29 05:47:36 +00:00
|
|
|
int addr_mode;
|
2017-12-29 23:08:25 +00:00
|
|
|
int inst_code;
|
2017-12-29 03:47:35 +00:00
|
|
|
int expected;
|
|
|
|
|
|
|
|
// The next byte is assumed to be the opcode we work with.
|
2017-12-31 05:02:30 +00:00
|
|
|
opcode = vm_segment_get(cpu->memory, address);
|
2017-12-29 03:47:35 +00:00
|
|
|
|
|
|
|
// And given that opcode, we need to see how many bytes large our
|
|
|
|
// operand will be.
|
2017-12-29 05:47:36 +00:00
|
|
|
addr_mode = mos6502_addr_mode(opcode);
|
|
|
|
expected = mos6502_dis_expected_bytes(addr_mode);
|
2017-12-29 03:47:35 +00:00
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
// The specific instruction we mean to execute
|
|
|
|
inst_code = mos6502_instruction(opcode);
|
|
|
|
|
2017-12-29 03:47:35 +00:00
|
|
|
// The operand itself defaults to zero... in cases where this
|
|
|
|
// doesn't change, the instruction related to the opcode will
|
|
|
|
// probably not even use it.
|
|
|
|
operand = 0;
|
|
|
|
|
|
|
|
// And we need to skip ahead of the opcode.
|
|
|
|
address++;
|
|
|
|
|
|
|
|
switch (expected) {
|
|
|
|
case 2:
|
|
|
|
// If we have a two-byte operand, then the first byte is the
|
|
|
|
// MSB and our operand will need to shift it 8 positions to
|
|
|
|
// the left before it can be OR'd.
|
2017-12-31 05:02:30 +00:00
|
|
|
operand |= vm_segment_get(cpu->memory, address) << 8;
|
2017-12-29 03:47:35 +00:00
|
|
|
address++;
|
|
|
|
|
|
|
|
// Note we fall through here to the next case...
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// If it's a one-byte operand, then this byte should occupy
|
|
|
|
// the LSB space which simply requires we OR the byte
|
|
|
|
// directly in. If this is part of a two-byte operand, then
|
|
|
|
// the same logic still applies.
|
2017-12-31 05:02:30 +00:00
|
|
|
operand |= vm_segment_get(cpu->memory, address);
|
2017-12-29 03:47:35 +00:00
|
|
|
address++;
|
|
|
|
|
|
|
|
// And, in any other case (e.g. 0), we are done; we don't
|
|
|
|
// read anything, and we leave the operand as it is.
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
// If the stream is NULL, we're doing some kind of lookahead.
|
|
|
|
// Furthermore, if this is an instruction that would switch control
|
|
|
|
// to a different spot in the program, then let's label this in the
|
|
|
|
// jump table.
|
|
|
|
if (stream == NULL && mos6502_would_jump(inst_code)) {
|
2017-12-31 05:02:30 +00:00
|
|
|
mos6502_dis_jump_label(cpu, operand, address, addr_mode);
|
2017-12-29 23:08:25 +00:00
|
|
|
}
|
2017-12-29 03:47:35 +00:00
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
// It's totally possible that we are not expected to print out the
|
|
|
|
// contents of our inspection of the opcode. (For example, we may
|
|
|
|
// just want to set the jump table in a lookahead operation.)
|
|
|
|
if (stream) {
|
|
|
|
// Hey! We might have a label at this position in the code. If
|
|
|
|
// so, let's print out the label.
|
|
|
|
if (jump_table[address]) {
|
|
|
|
// This will print out just the label itself.
|
|
|
|
mos6502_dis_label(stream, address);
|
2017-12-29 03:47:35 +00:00
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
// But to actually define the label, we need a colon to
|
|
|
|
// complete the notation. (We don't _need_ a newline, but it
|
|
|
|
// looks nicer to my arbitrary sensibilities. Don't @ me!)
|
|
|
|
fprintf(stream, ":\n");
|
|
|
|
}
|
2017-12-29 03:47:35 +00:00
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
// Let's print out to the stream what we have so far. First, we
|
|
|
|
// indent by four spaces.
|
|
|
|
fprintf(stream, " ");
|
2017-12-29 03:47:35 +00:00
|
|
|
|
2017-12-29 23:08:25 +00:00
|
|
|
// Print out the instruction code that our opcode represents.
|
|
|
|
mos6502_dis_instruction(stream, inst_code);
|
|
|
|
|
|
|
|
if (expected) {
|
|
|
|
// Let's "tab" over; each instruction code is 3 characters, so let's
|
|
|
|
// move over 5 spaces (4 spaces indent + 1, just to keep everything
|
|
|
|
// aligned by 4-character boundaries).
|
|
|
|
fprintf(stream, " ");
|
|
|
|
|
|
|
|
// Print out the operand given the proper address mode.
|
2017-12-31 05:02:30 +00:00
|
|
|
mos6502_dis_operand(cpu, stream, address, addr_mode, operand);
|
2017-12-29 23:08:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// And let's terminate the line.
|
|
|
|
fprintf(stream, "\n");
|
|
|
|
}
|
2017-12-29 03:47:35 +00:00
|
|
|
|
|
|
|
// The expected number of bytes here is for the operand, but we need
|
|
|
|
// to add one for the opcode to return the true number that this
|
|
|
|
// opcode sequence would consume.
|
|
|
|
return expected + 1;
|
|
|
|
}
|
2017-12-29 21:31:05 +00:00
|
|
|
|
2018-01-07 22:07:29 +00:00
|
|
|
/*
|
|
|
|
* Scan the CPU memory, from a given position until a given end, and
|
|
|
|
* print the results into a given file stream.
|
|
|
|
*/
|
2017-12-29 21:31:05 +00:00
|
|
|
void
|
2017-12-31 05:02:30 +00:00
|
|
|
mos6502_dis_scan(mos6502 *cpu, FILE *stream, int pos, int end)
|
2017-12-29 21:31:05 +00:00
|
|
|
{
|
|
|
|
while (pos < end) {
|
2017-12-31 05:02:30 +00:00
|
|
|
pos += mos6502_dis_opcode(cpu, stream, pos);
|
2017-12-29 21:31:05 +00:00
|
|
|
}
|
|
|
|
}
|
2017-12-29 23:08:25 +00:00
|
|
|
|
2018-01-07 22:07:29 +00:00
|
|
|
/*
|
|
|
|
* Associate a label with a given address or operand, depending on the
|
|
|
|
* address mode. For example, with REL, the jump label will be based on
|
|
|
|
* the address but added to or subtracted with the operand. Whereas in
|
|
|
|
* IND, the address is wholly dependent on the operand.
|
|
|
|
*/
|
2017-12-29 23:08:25 +00:00
|
|
|
void
|
2017-12-31 05:02:30 +00:00
|
|
|
mos6502_dis_jump_label(mos6502 *cpu,
|
|
|
|
vm_16bit operand,
|
2017-12-31 03:48:16 +00:00
|
|
|
int address,
|
|
|
|
int addr_mode)
|
2017-12-29 23:08:25 +00:00
|
|
|
{
|
2017-12-31 03:48:16 +00:00
|
|
|
int jump_loc;
|
2017-12-29 23:08:25 +00:00
|
|
|
|
2017-12-31 03:48:16 +00:00
|
|
|
switch (addr_mode) {
|
|
|
|
// With indirect address mode, the address we want to jump to is
|
|
|
|
// not the literal operand, but a 16-bit address that is
|
|
|
|
// _pointed to_ by the address represented by the operand. Think
|
|
|
|
// of the operand as a kind of double pointer, or just re-watch
|
|
|
|
// Inception.
|
|
|
|
case IND:
|
2017-12-31 05:02:30 +00:00
|
|
|
jump_loc = vm_segment_get(cpu->memory, operand) << 8;
|
|
|
|
jump_loc |= vm_segment_get(cpu->memory, operand + 1);
|
2017-12-31 03:48:16 +00:00
|
|
|
break;
|
2017-12-29 23:08:25 +00:00
|
|
|
|
2017-12-31 03:48:16 +00:00
|
|
|
// In relative address mode, the jump location will be a
|
|
|
|
// number -- well -- relative to the address. If the 8th bit
|
|
|
|
// of the operand is 1, then we treat the number as a
|
|
|
|
// negative; otherwise, positive or zero.
|
|
|
|
case REL:
|
|
|
|
jump_loc = address + operand;
|
|
|
|
|
|
|
|
if (operand > 127) {
|
|
|
|
jump_loc -= 256;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
return;
|
2017-12-29 23:08:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
jump_table[jump_loc] = 1;
|
|
|
|
}
|
|
|
|
|
2018-01-07 22:07:29 +00:00
|
|
|
/*
 * Print out the form of our label to the given file stream: the text
 * "ADDR_" followed by the address in decimal. This is fairly dumb;
 * it'll print out whatever address you give to it, whether or not a
 * label was ever recorded there.
 *
 * This is deliberately not declared `inline`: a plain `inline`
 * definition only provides an external definition when some other
 * declaration in the translation unit lacks `inline`, and this function
 * needs to be linkable no matter how it happens to be declared.
 */
void
mos6502_dis_label(FILE *stream, int address)
{
    fprintf(stream, "ADDR_%d", address);
}
|
|
|
|
|
2018-01-07 22:07:29 +00:00
|
|
|
/*
|
|
|
|
* Remove the previously-set label in the jump table for a given
|
|
|
|
* address.
|
|
|
|
*/
|
2017-12-29 23:08:25 +00:00
|
|
|
inline void
|
|
|
|
mos6502_dis_jump_unlabel(int address)
|
|
|
|
{
|
|
|
|
jump_table[address] = 0;
|
|
|
|
}
|
|
|
|
|
2018-01-07 22:07:29 +00:00
|
|
|
/*
|
|
|
|
* Return true if the given address has a jump label associated with it.
|
|
|
|
*/
|
2017-12-29 23:08:25 +00:00
|
|
|
inline bool
|
|
|
|
mos6502_dis_is_jump_label(int address)
|
|
|
|
{
|
|
|
|
return jump_table[address] == 1;
|
|
|
|
}
|