allSections; std::vector externals; // external labels organized by object file MapSymbolArray map; // CPU target struct mnem *opcode_table; int opcode_count; CPUIndex cpu, list_cpu; OPLookup aInstructions[MAX_OPCODES_DIRECTIVES]; int num_instructions; int default_org; // context for macros / include files ContextStack contextStack; // Current section Section *current_section; // Special syntax rules AsmSyntax syntax; // Conditional assembly vars int conditional_depth; // conditional depth / base depth for context strref conditional_source[MAX_CONDITIONAL_DEPTH]; // start of conditional for error report int8_t conditional_nesting[MAX_CONDITIONAL_DEPTH]; bool conditional_consumed[MAX_CONDITIONAL_DEPTH]; // Scope info int scope_address[MAX_SCOPE_DEPTH]; int scope_depth; int brace_depth; // scope depth defined only by braces, not files // Eval relative result (only valid if EvalExpression returns STATUS_RELATIVE_SECTION) int lastEvalSection; int lastEvalValue; int8_t lastEvalShift; strref export_base_name; // binary output name if available strref last_label; // most recently defined label for Merlin macro int8_t list_flags; // listing flags accumulating for each line bool accumulator_16bit; // 65816 specific software dependent immediate mode bool index_reg_16bit; // -"- int8_t cycle_counter_level; // merlin toggles the cycle counter rather than hierarchically evals bool error_encountered; // if any error encountered, don't export binary bool list_assembly; // generate assembler listing bool end_macro_directive; // whether to use { } or macro / endmacro for macro scope // Convert source to binary void Assemble(strref source, strref filename, bool obj_target); // Push a new context and handle enter / exit of context StatusCode PushContext(strref src_name, strref src_file, strref code_seg, int rept = 1); StatusCode PopContext(); // Generate assembler listing if requested bool List(strref filename); // Generate source for all valid instructions and addressing modes for current CPU bool AllOpcodes(strref filename); // Clean up memory allocations, reset assembler state void Cleanup(); // Make sure there is room to write more code StatusCode CheckOutputCapacity(uint32_t addSize); // Operations on current section void SetSection(strref name, int address); // fixed address section void SetSection(strref name); // relative address section void LinkLabelsToAddress(int section_id, int section_new, int section_address); StatusCode LinkRelocs(int section_id, int section_new, int section_address); StatusCode AssignAddressToSection(int section_id, int address); StatusCode LinkSections(strref name); // link relative address sections with this name here StatusCode MergeSections(int section_id, int section_merge); // Combine the result of a section onto another StatusCode MergeSectionsByName(int first_section); StatusCode MergeAllSections(int first_section); void DummySection(int address); // non-data section (fixed) void DummySection(); // non-data section (relative) void EndSection(); // pop current section Section& CurrSection() { return *current_section; } void AssignAddressToGroup(); // Merlin LNK support uint8_t* BuildExport(strref append, int &file_size, int &addr); int GetExportNames(strref *aNames, int maxNames); StatusCode LinkZP(); int SectionId() { return int(current_section - &allSections[0]); } int SectionId(Section &s) { return (int)(&s - &allSections[0]); } void AddByte(int b) { CurrSection().AddByte(b); } void AddWord(int w) { CurrSection().AddWord(w); } void AddTriple(int l) { CurrSection().AddTriple(l); } void AddBin(const uint8_t *p, int size) { CurrSection().AddBin(p, size); } // Object file handling StatusCode WriteObjectFile(strref filename); // write x65 object file StatusCode ReadObjectFile(strref filename, int link_to_section = -1); // read x65 object file // Apple II GS OMF StatusCode WriteA2GS_OMF(strref filename, bool full_collapse); // Scope management StatusCode EnterScope(); StatusCode ExitScope(); // Macro management StatusCode AddMacro(strref macro, strref source_name, strref source_file, strref &left); StatusCode BuildMacro(Macro &m, strref arg_list); // Structs StatusCode BuildStruct(strref name, strref declaration); StatusCode EvalStruct(strref name, int &value); StatusCode BuildEnum(strref name, strref declaration); // Calculate a value based on an expression. EvalOperator RPNToken_Merlin(strref &expression, const struct EvalContext &etx, EvalOperator prev_op, int16_t §ion, int &value); EvalOperator RPNToken(strref &expression, const struct EvalContext &etx, EvalOperator prev_op, int16_t §ion, int &value, strref &subexp); StatusCode EvalExpression(strref expression, const struct EvalContext &etx, int &result); void SetEvalCtxDefaults(struct EvalContext &etx); int ReptCnt() const; // Access labels Label* GetLabel(strref label); Label* GetLabel(strref label, int file_ref); Label* AddLabel(uint32_t hash); bool MatchXDEF(strref label); StatusCode AssignLabel(strref label, strref line, bool make_constant = false); StatusCode AddressLabel(strref label); void LabelAdded(Label *pLabel, bool local = false); StatusCode IncludeSymbols(strref line); // Strings StringSymbol *GetString(strref string_name); StringSymbol *AddString(strref string_name, strref string_value); StatusCode StringAction(StringSymbol *pStr, strref line); StatusCode ParseStringOp(StringSymbol *pStr, strref line); // Manage locals void MarkLabelLocal(strref label, bool scope_label = false); StatusCode FlushLocalLabels(int scope_exit = -1); // Label pools LabelPool* GetLabelPool(strref pool_name); StatusCode AddLabelPool(strref name, strref args); StatusCode AssignPoolLabel(LabelPool &pool, strref args); // Late expression evaluation void AddLateEval(int target, int pc, int scope_pc, strref expression, strref source_file, LateEval::Type type); void AddLateEval(strref label, int pc, int scope_pc, strref expression, LateEval::Type type); StatusCode CheckLateEval(strref added_label = strref(), int scope_end = -1, bool missing_is_error = false); // Assembler Directives StatusCode ApplyDirective(AssemblerDirective dir, strref line, strref source_file); StatusCode Directive_Rept(strref line); StatusCode Directive_Macro(strref line); StatusCode Directive_String(strref line); StatusCode Directive_Undef(strref line); StatusCode Directive_Include(strref line); StatusCode Directive_Incbin(strref line, int skip=0, int len=0); StatusCode Directive_Import(strref line); StatusCode Directive_ORG(strref line); StatusCode Directive_LOAD(strref line); StatusCode Directive_MERGE(strref line); StatusCode Directive_LNK(strref line); StatusCode Directive_XDEF(strref line); StatusCode Directive_XREF(strref label); StatusCode Directive_DC(strref line, int width, strref source_file); StatusCode Directive_DS(strref line); StatusCode Directive_ALIGN(strref line); StatusCode Directive_EVAL(strref line); StatusCode Directive_HEX(strref line); StatusCode Directive_ENUM_STRUCT(strref line, AssemblerDirective dir); // Assembler steps StatusCode GetAddressMode(strref line, bool flipXY, uint32_t validModes, AddrMode &addrMode, int &len, strref &expression); StatusCode AddOpcode(strref line, int index, strref source_file); StatusCode BuildLine(strref line); StatusCode BuildSegment(); // Display error in stderr void PrintError(strref line, StatusCode error); // Conditional Status bool ConditionalAsm(); // Assembly is currently enabled bool NewConditional(); // Start a new conditional block void CloseConditional(); // Close a conditional block void CheckConditionalDepth(); // Check if this conditional will nest the assembly (a conditional is already consumed) void ConsumeConditional(); // This conditional block is going to be assembled, mark it as consumed bool ConditionalConsumed(); // Has a block of this conditional already been assembled? void SetConditional(); // This conditional block is not going to be assembled so mark that it is nesting bool ConditionalAvail(); // Returns true if this conditional can be consumed void ConditionalElse(); // Conditional else that does not enable block void EnableConditional(bool enable); // This conditional block is enabled and the prior wasn't // Conditional statement evaluation (A==B? A?) StatusCode EvalStatement(strref line, bool &result); // Add include folder void AddIncludeFolder(strref path); char* LoadText(strref filename, size_t &size); char* LoadBinary(strref filename, size_t &size); // Change CPU void SetCPU(CPUIndex CPU); // Syntax bool Merlin() const { return syntax == SYNTAX_MERLIN; } // constructor Asm() : opcode_table(opcodes_6502), opcode_count(num_opcodes_6502), num_instructions(0), cpu(CPU_6502), list_cpu(CPU_6502) { Cleanup(); localLabels.reserve(256); loadedData.reserve(16); lateEval.reserve(64); } }; // Clean up work allocations void Asm::Cleanup() { for (std::vector::iterator i = loadedData.begin(); i != loadedData.end(); ++i) { if (char *data = *i) free(data); } map.clear(); labelPools.clear(); loadedData.clear(); labels.clear(); macros.clear(); allSections.clear(); for (uint32_t i = 0; i < strings.count(); ++i) { StringSymbol &str = strings.getValue(i); if (str.string_value.cap()) free(str.string_value.charstr()); } strings.clear(); for (std::vector::iterator exti = externals.begin(); exti !=externals.end(); ++exti) exti->labels.clear(); externals.clear(); // this section is relocatable but is assigned address $1000 if exporting without directives SetSection(strref("default,code")); current_section = &allSections[0]; syntax = SYNTAX_SANE; default_org = 0x1000; scope_depth = 0; brace_depth = 0; conditional_depth = 0; conditional_nesting[0] = 0; conditional_consumed[0] = false; error_encountered = false; list_assembly = false; end_macro_directive = false; accumulator_16bit = false; // default 65816 8 bit immediate mode index_reg_16bit = false; // other CPUs won't be affected. cycle_counter_level = 0; } int sortHashLookup(const void *A, const void *B) { const OPLookup *_A = (const OPLookup*)A; const OPLookup *_B = (const OPLookup*)B; return _A->op_hash > _B->op_hash ? 1 : -1; } int BuildInstructionTable(OPLookup *pInstr, struct mnem *opcodes, int count, const char **aliases, bool merlin) { // create an instruction table (mnemonic hash lookup) int numInstructions = 0; for (int i = 0; i < count; i++) { OPLookup &op = pInstr[numInstructions++]; op.op_hash = strref(opcodes[i].instr).fnv1a_lower(); op.index = (uint8_t)i; op.type = OT_MNEMONIC; } // add instruction aliases if (aliases) { while (*aliases) { strref orig(*aliases++); strref alias(*aliases++); for (int o=0; o list_cpu) list_cpu = cpu; opcode_table = aCPUs[CPU].opcodes; opcode_count = aCPUs[CPU].num_opcodes; num_instructions = BuildInstructionTable(aInstructions, opcode_table, opcode_count, aCPUs[CPU].aliases, Merlin()); } // Read in text data (main source, include, etc.) char* Asm::LoadText(strref filename, size_t &size) { strown<512> file(filename); std::vector::iterator i = includePaths.begin(); for (;;) { if (FILE *f = fopen(file.c_str(), "rb")) { // rb is intended here since OS fseek(f, 0, SEEK_END); // eol conversion can do ugly things size_t _size = ftell(f); fseek(f, 0, SEEK_SET); if (char *buf = (char*)calloc(_size, 1)) { fread(buf, _size, 1, f); fclose(f); size = _size; return buf; } fclose(f); } if (i==includePaths.end()) break; file.copy(*i); if (file.get_last()!='/' && file.get_last()!='\\') file.append('/'); file.append(filename); ++i; } size = 0; return nullptr; } // Read in binary data (incbin) char* Asm::LoadBinary(strref filename, size_t &size) { strown<512> file(filename); std::vector::iterator i = includePaths.begin(); for (;;) { if (FILE *f = fopen(file.c_str(), "rb")) { fseek(f, 0, SEEK_END); size_t _size = ftell(f); fseek(f, 0, SEEK_SET); if (char *buf = (char*)malloc(_size)) { fread(buf, _size, 1, f); fclose(f); size = _size; return buf; } fclose(f); } if (i==includePaths.end()) break; file.copy(*i); if (file.get_last()!='/' && file.get_last()!='\\') file.append('/'); file.append(filename); #ifdef WIN32 file.replace('/', '\\'); #endif ++i; } size = 0; return nullptr; } // Create a new section with a fixed address void Asm::SetSection(strref name, int address) { if (name) { for (std::vector

::iterator i = allSections.begin(); i!=allSections.end(); ++i) { if (i->name && name.same_str(i->name)) { current_section = &*i; return; } } } if (allSections.size()==allSections.capacity()) { allSections.reserve(allSections.size()+16); } Section newSection(name, address); // don't compile over zero page and stack frame (may be bad assumption) if (address<0x200) { newSection.SetDummySection(true); } allSections.push_back(newSection); current_section = &allSections[allSections.size()-1]; } void Asm::SetSection(strref line) { if (allSections.size()&&CurrSection().unused()) { allSections.erase(allSections.begin()+SectionId()); } if (allSections.size()==allSections.capacity()) { allSections.reserve(allSections.size()+16); } SectionType type = ST_UNDEFINED; if (line.get_first() == '.') { // SEG.U etc. ++line; switch (strref::tolower(line.get_first())) { case 'u': type = ST_BSS; break; case 'z': type = ST_ZEROPAGE; break; case 'd': type = ST_DATA; break; case 'c': type = ST_CODE; break; } } line.trim_whitespace(); int align = 1; strref name; while (strref arg = line.split_token_any_trim(",:")) { if (arg.get_first() == '$') { ++arg; align = (int)arg.ahextoui(); } else if (arg.is_number()) { align = (int)arg.atoi(); } else if (arg.get_first()=='"') { name = (arg+1).before_or_full('"'); } else if (!name) { name = arg; } else if (arg.same_str("code")) { type = ST_CODE; } else if (arg.same_str("data")) { type = ST_DATA; } else if (arg.same_str("bss")) { type = ST_BSS; } else if (arg.same_str("zp")||arg.same_str("dp")|| arg.same_str("zeropage")||arg.same_str("direct")) { type = ST_ZEROPAGE; } } if (type == ST_UNDEFINED) { if (name.find("code")>=0) { type = ST_CODE; } else if (name.find("data")>=0) { type = ST_DATA; } else if (name.find("bss") >= 0 || name.same_str("directpage_stack")) type = ST_BSS; else if (name.find("zp")>=0||name.find("zeropage")>=0||name.find("direct")>=0) { type = ST_ZEROPAGE; } else { type = ST_CODE; } } Section newSection(name); newSection.align_address = align; newSection.type = type; allSections.push_back(newSection); current_section = &allSections[allSections.size()-1]; } // Fixed address dummy section void Asm::DummySection(int address) { if (allSections.size()==allSections.capacity()) { allSections.reserve(allSections.size()+16); } Section newSection(strref(), address); newSection.SetDummySection(true); allSections.push_back(newSection); current_section = &allSections[allSections.size()-1]; } // Current address dummy section void Asm::DummySection() { DummySection(CurrSection().GetPC()); } void Asm::EndSection() { int section = SectionId(); if (section) { current_section = &allSections[section-1]; } } // Iterate through the current group of sections and assign addresses if this section is fixed // This is to handle the special linking of Merlin where sections are brought together pre-export void Asm::AssignAddressToGroup() { Section &curr = CurrSection(); if (!curr.address_assigned) { return; } // Put in all the sections cared about into either the fixed sections or the relative sections std::vector FixedExport; std::vector RelativeExport; int seg = SectionId(); while (seg>=0) { Section &s = allSections[seg]; if (s.address_assigned && s.type != ST_ZEROPAGE && s.start_address >= curr.start_address) { bool inserted = false; for (std::vector::iterator i = FixedExport.begin(); i!=FixedExport.end(); ++i) { if (s.start_address < (*i)->start_address) { FixedExport.insert(i, &s); inserted = true; break; } } if (!inserted) { FixedExport.push_back(&s); } } else if (!s.address_assigned && s.type != ST_ZEROPAGE) { RelativeExport.push_back(&s); s.export_append = curr.export_append; } seg = allSections[seg].next_group; } // in this case each block should be added individually in order of code / data / bss for (int type = ST_CODE; type <= ST_BSS; type++) { std::vector::iterator i = RelativeExport.begin(); while (i!=RelativeExport.end()) { Section *pSec = *i; if (pSec->type == type) { int bytes = pSec->address - pSec->start_address; size_t insert_after = FixedExport.size()-1; for (size_t p = 0; paddress; int start_next = FixedExport[p+1]->start_address; int avail = start_next - end_prev; if (avail >= bytes) { int addr = end_prev; addr += pSec->align_address <= 1 ? 0 : (pSec->align_address - (addr % pSec->align_address)) % pSec->align_address; if ((addr + bytes) <= start_next) { insert_after = p; break; } } } int address = FixedExport[insert_after]->address; address += pSec->align_address <= 1 ? 0 : (pSec->align_address - (address % pSec->align_address)) % pSec->align_address; AssignAddressToSection(SectionId(*pSec), address); FixedExport.insert((FixedExport.begin() + insert_after + 1), pSec); i = RelativeExport.erase(i); } else { ++i; } } } } // list all export append names // for each valid export append name build a binary fixed address code // - find lowest and highest address // - alloc & 0 memory // - any matching relative sections gets linked in after // - go through all section that matches export_append in order and copy over memory uint8_t* Asm::BuildExport(strref append, int &file_size, int &addr) { int start_address = 0x7fffffff; int end_address = 0; bool has_relative_section = false; bool has_fixed_section = false; int first_link_section = -1; std::vector FixedExport; // automatically merge sections with the same name and type if one is relative and other is fixed for (size_t section_id = 0; section_id!=allSections.size(); ++section_id) { const Section §ion = allSections[section_id]; if (!section.IsMergedSection()&&!section.IsRelativeSection()) { for (size_t section_merge_id = 0; section_merge_id!=allSections.size(); ++section_merge_id) { const Section §ion_merge = allSections[section_merge_id]; if(!section_merge.IsMergedSection()&§ion_merge.IsRelativeSection() && section_merge.type == section.type && section.name.same_str_case(section_merge.name)) { MergeSections((int)section_id, (int)section_merge_id); } } } } // link any relocs to sections that are fixed for (size_t section_id = 0; section_id!=allSections.size(); ++section_id) { const Section §ion = allSections[section_id]; if(!section.IsMergedSection()&&!section.IsRelativeSection()) { LinkRelocs((int)section_id, -1, section.start_address); } } // find address range while (!has_relative_section && !has_fixed_section) { int section_id = 0; for (std::vector

::iterator i = allSections.begin(); i != allSections.end(); ++i) { if (((!append && !i->export_append) || append.same_str_case(i->export_append)) && i->type != ST_ZEROPAGE) { if (!i->IsMergedSection()) { if (i->IsRelativeSection()) { // prioritize code over data, local code over included code for initial binary segment if ((i->type == ST_CODE || i->type == ST_DATA) && i->first_group < 0 && (first_link_section < 0 || (i->type == ST_CODE && (allSections[first_link_section].type == ST_DATA || (!i->include_from && allSections[first_link_section].include_from))))) first_link_section = SectionId(*i); has_relative_section = true; } else if (i->start_address >= 0x100 && ( i->size() > 0 || i->addr_size() > 0 ) ) { has_fixed_section = true; bool inserted = false; for (std::vector::iterator f = FixedExport.begin(); f != FixedExport.end(); ++f) { if ((*f)->start_address > i->start_address) { FixedExport.insert(f, &*i); inserted = true; break; } } if (!inserted) FixedExport.push_back(&*i); if (i->start_address < start_address) start_address = i->start_address; if ((i->start_address + (int)i->size()) > end_address) { end_address = i->start_address + (int)i->size(); } } } } section_id++; } if (!has_relative_section && !has_fixed_section) return nullptr; if (has_relative_section) { if (!has_fixed_section) { // there is not a fixed section so go through and assign addresses to all sections // starting with the first reasonable section start_address = default_org; if (first_link_section<0) { return nullptr; } while (first_link_section >= 0) { FixedExport.push_back(&allSections[first_link_section]); AssignAddressToSection(first_link_section, start_address); start_address = allSections[first_link_section].address; first_link_section = allSections[first_link_section].next_group; } } // First link code sections, then data sections, then BSS sections for (int sectype = ST_CODE; sectype <= ST_BSS; sectype++) { // there are fixed sections so fit all relative sections after or inbetween fixed sections in export group for (std::vector

::iterator i = allSections.begin(); i != allSections.end(); ++i) { if (sectype == i->type && ((!append && !i->export_append) || append.same_str_case(i->export_append))) { int id = (int)(&*i - &allSections[0]); if (i->IsRelativeSection() && i->first_group < 0) { // try to fit this section in between existing sections if possible int insert_after = (int)FixedExport.size()-1; for (int f = 0; f < insert_after; f++) { int start_block = FixedExport[f]->address; int end_block = FixedExport[f + 1]->start_address; if ((end_block - start_block) >= (i->address - i->start_address)) { int addr_block = start_block; int sec = id; while (sec >= 0) { Section &s = allSections[sec]; addr_block += s.align_address <= 1 ? 0 : (s.align_address - (addr_block % s.align_address)) % s.align_address; addr_block += s.address - s.start_address; sec = s.next_group; } if (addr_block <= end_block) { insert_after = f; break; } } } int sec = id; start_address = FixedExport[insert_after]->address; while (sec >= 0) { insert_after++; if (insert_after<(int)FixedExport.size()) { FixedExport.insert(FixedExport.begin()+insert_after, &allSections[sec]); } else { FixedExport.push_back(&allSections[sec]); } AssignAddressToSection(sec, start_address); start_address = allSections[sec].address; sec = allSections[sec].next_group; } } } } } } } // get memory for output buffer start_address = FixedExport[0]->start_address; int last_data_export = (int)(FixedExport.size() - 1); while (last_data_export>0&&FixedExport[last_data_export]->type==ST_BSS) { last_data_export--; } end_address = FixedExport[last_data_export]->address; uint8_t *output = (uint8_t*)calloc(1, end_address - start_address); // copy over in order for (std::vector

::iterator i = allSections.begin(); i != allSections.end(); ++i) { if (((!append && !i->export_append) || append.same_str_case(i->export_append)) && i->type != ST_ZEROPAGE) { if (i->merged_offset==-1&&i->start_address>=0x200&&i->size()>0) { memcpy(output+i->start_address-start_address, i->output, i->size()); } } } printf("Linker export + \"" STRREF_FMT "\" summary:\n", STRREF_ARG(append)); for (std::vector::iterator f = FixedExport.begin(); f != FixedExport.end(); ++f) { if ((*f)->include_from) { printf("* $%04x-$%04x: " STRREF_FMT " (%d) included from " STRREF_FMT "\n", (*f)->start_address, (*f)->address, STRREF_ARG((*f)->name), (int)(*f - &allSections[0]), STRREF_ARG((*f)->include_from)); } else { printf("* $%04x-$%04x: " STRREF_FMT " (%d)\n", (*f)->start_address, (*f)->address, STRREF_ARG((*f)->name), (int)(*f - &allSections[0])); } } // return the result file_size = end_address - start_address; addr = start_address; return output; } // Collect all the export names int Asm::GetExportNames(strref *aNames, int maxNames) { int count = 0; for (std::vector

::iterator i = allSections.begin(); i != allSections.end(); ++i) { if (!i->IsMergedSection()) { bool found = false; uint32_t hash = i->export_append.fnv1a_lower(); for (int n = 0; n < count; n++) { if (aNames[n].fnv1a_lower() == hash) { found = true; break; } } if (!found && countexport_append; } } } return count; } // Collect all unassigned ZP sections and link them StatusCode Asm::LinkZP() { uint8_t min_addr = 0xff, max_addr = 0x00; int num_addr = 0; bool has_assigned = false, has_unassigned = false; int first_unassigned = -1; // determine if any zeropage section has been asseigned for (std::vector

::iterator s = allSections.begin(); s!=allSections.end(); ++s) { if (s->type==ST_ZEROPAGE&&!s->IsMergedSection()) { if (s->address_assigned) { has_assigned = true; if (s->start_address<(int)min_addr) { min_addr = (uint8_t)s->start_address; } else if ((int)s->address>max_addr) { max_addr = (uint8_t)s->address; } } else { has_unassigned = true; first_unassigned = first_unassigned>=0 ? first_unassigned : (int)(&*s-&allSections[0]); } num_addr += s->address-s->start_address; } } if (num_addr>0x100) { return ERROR_ZEROPAGE_SECTION_OUT_OF_RANGE; } // no unassigned zp section, nothing to fix if (!has_unassigned) { return STATUS_OK; } StatusCode status = STATUS_OK; if (!has_assigned) { // no section assigned => fit together at end int address = 0x100 - num_addr; for (std::vector

::iterator s = allSections.begin(); status==STATUS_OK && s != allSections.end(); ++s) { if (s->type == ST_ZEROPAGE && !s->IsMergedSection()) { status = AssignAddressToSection((int)(&*s - &allSections[0]), address); address = s->address; } } } else { // find first fit neighbouring an address assigned zero page section for (std::vector

::iterator s = allSections.begin(); s != allSections.end(); ++s) { if (s->type == ST_ZEROPAGE && !s->IsMergedSection() && !s->address_assigned) { int size = s->address - s->start_address; bool found = false; // find any assigned address section and try to place before or after for (std::vector

::iterator sa = allSections.begin(); sa != allSections.end(); ++sa) { if (sa->type == ST_ZEROPAGE && !sa->IsMergedSection() && sa->address_assigned) { for (int e = 0; e < 2; ++e) { int start = e ? sa->start_address - size : sa->address; int align_size = s->align_address <= 1 ? 0 : (s->align_address - (start % s->align_address)) % s->align_address; start += align_size; int end = start + size; if (start >= 0 && end <= 0x100) { for (std::vector

::iterator sc = allSections.begin(); !found && sc != allSections.end(); ++sc) { found = true; if (&*sa != &*sc && sc->type == ST_ZEROPAGE && !sc->IsMergedSection() && sc->address_assigned) { if (start <= sc->address && sc->start_address <= end) found = false; } } } if (found) { AssignAddressToSection((int)(&*s-&allSections[0]), start); } } } } if (!found) { return ERROR_ZEROPAGE_SECTION_OUT_OF_RANGE; } } } } return status; } // Apply labels assigned to addresses in a relative section a fixed address or as part of another section void Asm::LinkLabelsToAddress(int section_id, int section_new, int section_address) { Label *pLabels = labels.getValues(); int numLabels = labels.count(); for (int l = 0; l < numLabels; l++) { if (pLabels->section == section_id) { pLabels->value += section_address; pLabels->section = section_new; if (pLabels->mapIndex>=0 && pLabels->mapIndex<(int)map.size()) { struct MapSymbol &msym = map[pLabels->mapIndex]; msym.value = pLabels->value; msym.section = (int16_t)section_new; } CheckLateEval(pLabels->label_name); } ++pLabels; } } // go through relocs in all sections to see if any targets this section // relocate section to address! StatusCode Asm::LinkRelocs(int section_id, int section_new, int section_address) { for (std::vector

::iterator j = allSections.begin(); j != allSections.end(); ++j) { Section &s2 = *j; if (s2.pRelocs) { relocList *pList = s2.pRelocs; relocList::iterator i = pList->end(); while (i != pList->begin()) { --i; if (i->target_section == section_id) { Section *trg_sect = &s2; size_t output_offs = 0; while (trg_sect->merged_offset>=0) { output_offs += trg_sect->merged_offset; trg_sect = &allSections[trg_sect->merged_section]; } // only finalize the target value if fixed address if (section_new == -1 || allSections[section_new].address_assigned) { uint8_t *trg = trg_sect->output + output_offs + i->section_offset; int value = i->base_value + section_address; if (i->shift < 0) value >>= -i->shift; else if (i->shift) value <<= i->shift; for (int b = 0; b < i->bytes; b++) *trg++ = (uint8_t)(value >> (b * 8)); i = pList->erase(i); if (i != pList->end()) ++i; } } } if (pList->empty()) { free(pList); s2.pRelocs = nullptr; } } } return STATUS_OK; } // Append one section to the end of another StatusCode Asm::AssignAddressToSection(int section_id, int address) { if (section_id<0||section_id>=(int)allSections.size()) { return ERROR_NOT_A_SECTION; } Section &s = allSections[section_id]; if (s.address_assigned) return ERROR_CANT_REASSIGN_FIXED_SECTION; // fix up the alignment of the address int align_size = s.align_address<=1 ? 0 : (s.align_address - (address%s.align_address))%s.align_address; address += align_size; s.start_address = address; s.address += address; s.address_assigned = true; LinkLabelsToAddress(section_id, -1, s.start_address); return LinkRelocs(section_id, -1, s.start_address); } // Link sections with a specific name at this point // Relative sections will just be appeneded to a grouping list // Fixed address sections will be merged together StatusCode Asm::LinkSections(strref name) { if (CurrSection().IsDummySection()) { return ERROR_LINKER_CANT_LINK_TO_DUMMY_SECTION; } int last_section_group = CurrSection().next_group; while (last_section_group > -1 && allSections[last_section_group].next_group > -1) last_section_group = allSections[last_section_group].next_group; for (std::vector

::iterator i = allSections.begin(); i != allSections.end(); ++i) { if ((!name || i->name.same_str_case(name)) && i->IsRelativeSection() && !i->IsMergedSection()) { // it is ok to link other sections with the same name to this section if (&*i==&CurrSection()) { continue; } // Zero page sections can only be linked with zero page sections if (i->type != ST_ZEROPAGE || CurrSection().type == ST_ZEROPAGE) { i->export_append = CurrSection().export_append; if (!i->address_assigned) { if (i->first_group < 0) { int prev = last_section_group >= 0 ? last_section_group : SectionId(); int curr = (int)(&*i - &allSections[0]); allSections[prev].next_group = curr; i->first_group = CurrSection().first_group ? CurrSection().first_group : SectionId(); last_section_group = curr; } } } else { return ERROR_CANT_LINK_ZP_AND_NON_ZP; } } } return STATUS_OK; } StatusCode Asm::MergeSections(int section_id, int section_merge) { if (section_id==section_merge||section_id<0||section_merge<0) { return STATUS_OK; } Section &s = allSections[section_id]; Section &m = allSections[section_merge]; // merging section needs to be relative to be appended if (!m.IsRelativeSection()) { return ERROR_CANT_APPEND_SECTION_TO_TARGET; } // if merging section is aligned and target section is not aligned to that or multiple of then can't merge if (m.align_address>1&&(!s.IsRelativeSection()||(s.align_address%m.align_address)!=0)) { return ERROR_CANT_APPEND_SECTION_TO_TARGET; } // append the binary to the target.. int addr_start = s.address; int align = m.align_address <= 1 ? 0 : (m.align_address - (addr_start % m.align_address)) % m.align_address; if (m.size()) { if (s.CheckOutputCapacity(m.size() + align) == STATUS_OK) { for (int a = 0; acapacity()<(s.pRelocs->size()+m.pRelocs->size())) { s.pRelocs->reserve(s.pRelocs->size()+m.pRelocs->size()); } for (relocList::iterator r = m.pRelocs->begin(); r!=m.pRelocs->end(); ++r) { struct Reloc rel = *r; rel.section_offset += addr_start; s.pRelocs->push_back(rel); } delete m.pRelocs; m.pRelocs = nullptr; } // go through all the relocs referring to merging section and replace for (std::vector

::iterator i = allSections.begin(); i!=allSections.end(); ++i) { if (relocList *pReloc = i->pRelocs) { for (relocList::iterator r = pReloc->begin(); r!=pReloc->end(); ++r) { if (r->target_section == section_merge) { r->base_value += addr_start; r->target_section = section_id; } } } } if(!s.IsRelativeSection()) { LinkLabelsToAddress(section_merge, -1, m.start_address); } // go through all labels referencing merging section for (uint32_t i = 0; isection == section_merge) { i->value += addr_start; i->section = (int16_t)section_id; } } // go through all late evals referencing this section for (std::vector::iterator i = lateEval.begin(); i!=lateEval.end(); ++i) { if (i->section == section_merge) { i->section = (int16_t)section_id; if (i->target>=0) { i->target += addr_start; } i->address += addr_start; if (i->scope>=0) { i->scope += addr_start; } } } // go through listing if (m.pListing) { if (!s.pListing) { s.pListing = new Listing; } if (s.pListing->capacity()<(m.pListing->size()+s.pListing->size())) { s.pListing->reserve((m.pListing->size()+s.pListing->size())); } for (Listing::iterator i = m.pListing->begin(); i!=m.pListing->end(); ++i) { ListLine l = *i; l.address += addr_start; s.pListing->push_back(l); } delete m.pListing; m.pListing = nullptr; } m.type = ST_REMOVED; return STATUS_OK; } // Go through sections and merge same name sections together StatusCode Asm::MergeSectionsByName(int first_section) { int first_code_seg = -1; StatusCode status = STATUS_OK; for (std::vector

::iterator i = allSections.begin(); i != allSections.end(); ++i) { if (i->type != ST_REMOVED) { if (first_code_seg<0 && i->type==ST_CODE) first_code_seg = (int)(&*i-&allSections[0]); std::vector

::iterator n = i; ++n; while (n != allSections.end()) { if (n->name.same_str_case(i->name) && n->type == i->type) { int sk = (int)(&*i - &allSections[0]); int sm = (int)(&*n - &allSections[0]); if (sm == first_section || (n->align_address > i->align_address)) { if (n->align_addressalign_address) { n->align_address = i->align_address; } status = MergeSections(sm, sk); } else { status = MergeSections(sk, sm); } if (status!=STATUS_OK) { return status; } } ++n; } } } return STATUS_OK; } // Merge all sections in order of code, data, bss and make sure a specific section remains first #define MERGE_ORDER_CNT (ST_BSS - ST_CODE+1) StatusCode Asm::MergeAllSections(int first_section) { StatusCode status = STATUS_OK; // combine all sections by type first for (int t = ST_CODE; tallSections[j].align_address) { allSections[i].align_address = allSections[j].align_address; } status = MergeSections(j, i); } else status = MergeSections(i, j); } } } } } // then combine by category except zero page int merge_order[MERGE_ORDER_CNT] = { -1 }; for (int t = ST_CODE; t <= ST_BSS; t++) { for (int i = 0; i<(int)allSections.size(); ++i) { if (allSections[i].type == t) { merge_order[t - ST_CODE] = i; break; } } } for (int n = 1; n < MERGE_ORDER_CNT; n++) { if (merge_order[n] == -1) { for (int m = n + 1; m < MERGE_ORDER_CNT; m++) merge_order[m - 1] = merge_order[m]; } } if (merge_order[0]==-1) { return ERROR_NOT_A_SECTION; } for (int o = 1; o < MERGE_ORDER_CNT; o++) { if (merge_order[o] != -1 && status == STATUS_OK) { if (allSections[merge_order[0]].align_address= output_capacity) { size_t newSize = currSize * 2; if (newSize<64*1024) { newSize = 64*1024; } if ((addSize+currSize)>newSize) { newSize += newSize; } if (uint8_t *new_output = (uint8_t*)malloc(newSize)) { memcpy(new_output, output, size()); curr = new_output + (curr - output); free(output); output = new_output; output_capacity = newSize; } else { return ERROR_OUT_OF_MEMORY; } } return STATUS_OK; } // Add one byte to a section void Section::AddByte(int b) { if (!dummySection && type != ST_ZEROPAGE && type != ST_BSS) { if (CheckOutputCapacity(1)==STATUS_OK) { *curr++ = (uint8_t)b; } } address++; } // Add a 16 bit word to a section void Section::AddWord(int w) { if (!dummySection && type != ST_ZEROPAGE && type != ST_BSS) { if (CheckOutputCapacity(2) == STATUS_OK) { *curr++ = (uint8_t)(w & 0xff); *curr++ = (uint8_t)(w >> 8); } } address += 2; } // Add a 24 bit word to a section void Section::AddTriple(int l) { if (!dummySection && type != ST_ZEROPAGE && type != ST_BSS) { if (CheckOutputCapacity(3) == STATUS_OK) { *curr++ = (uint8_t)(l & 0xff); *curr++ = (uint8_t)(l >> 8); *curr++ = (uint8_t)(l >> 16); } } address += 3; } // Add arbitrary length data to a section void Section::AddBin(const uint8_t *p, int size) { if (!dummySection && type != ST_ZEROPAGE && type != ST_BSS) { if (CheckOutputCapacity(size) == STATUS_OK) { memcpy(curr, p, size); curr += size; } } address += size; } // Add text data to a section void Section::AddText(strref line, strref text_prefix) { // https://en.wikipedia.org/wiki/PETSCII // ascii: no change // shifted: a-z => $41.. A-Z => $61.. // unshifted: a-z, A-Z => $41 if (CheckOutputCapacity((uint32_t)line.get_len()) == STATUS_OK) { if (!text_prefix || text_prefix.same_str("ascii")) { AddBin((const uint8_t*)line.get(), (int)line.get_len()); } else if (text_prefix.same_str("petscii")) { while (line) { char c = line[0]; AddByte((c >= 'a' && c <= 'z') ? (c - 'a' + 'A') : (c > 0x60 ? ' ' : line[0])); ++line; } } else if (text_prefix.same_str("petscii_shifted")) { while (line) { char c = line[0]; AddByte((c >= 'a' && c <= 'z') ? (c - 'a' + 0x61) : ((c >= 'A' && c <= 'Z') ? (c - 'A' + 0x61) : (c > 0x60 ? ' ' : line[0]))); ++line; } } } } void Section::AddIndexText(StringSymbol *strSym, strref text) { if (CheckOutputCapacity((uint32_t)text.get_len())==STATUS_OK) { const strref lookup = strSym->get(); while (text) { char c = text.pop_first(); AddByte(lookup.find(c)); } } } // Add a relocation marker to a section void Section::AddReloc(int base, int offset, int section, int8_t bytes, int8_t shift) { if (!pRelocs) { pRelocs = new relocList; } if (pRelocs->size()==pRelocs->capacity()) { pRelocs->reserve(pRelocs->size()+32); } pRelocs->push_back(Reloc(base, offset, section, bytes, shift)); } // Make sure there is room to assemble in StatusCode Asm::CheckOutputCapacity(uint32_t addSize) { return CurrSection().CheckOutputCapacity(addSize); } // // // SCOPE MANAGEMENT // // StatusCode Asm::EnterScope() { if (scope_depth>=(MAX_SCOPE_DEPTH-1)) { return ERROR_TOO_DEEP_SCOPE; } scope_address[++scope_depth] = CurrSection().GetPC(); return STATUS_OK; } StatusCode Asm::ExitScope() { CheckLateEval(strref(), CurrSection().GetPC()); StatusCode error = FlushLocalLabels(scope_depth); if (error>=FIRST_ERROR) { return error; } --scope_depth; if (scope_depth<0) { return ERROR_UNBALANCED_SCOPE_CLOSURE; } return STATUS_OK; } // // // CONTEXT ISOLATION // // StatusCode Asm::PushContext(strref src_name, strref src_file, strref code_seg, int rept) { if (conditional_depth>=(MAX_CONDITIONAL_DEPTH-1)) { return ERROR_CONDITION_TOO_NESTED; } conditional_depth++; conditional_nesting[conditional_depth] = 0; conditional_consumed[conditional_depth] = false; contextStack.push(src_name, src_file, code_seg, rept); contextStack.curr().conditional_ctx = (int16_t)conditional_depth; if (scope_depth>=(MAX_SCOPE_DEPTH-1)) { return ERROR_TOO_DEEP_SCOPE; } else { scope_address[++scope_depth] = CurrSection().GetPC(); } return STATUS_OK; } StatusCode Asm::PopContext() { if (scope_depth) { StatusCode ret = ExitScope(); if (ret!=STATUS_OK) { return ret; } } if (!ConditionalAsm()||ConditionalConsumed()|| conditional_depth!=contextStack.curr().conditional_ctx) { return ERROR_UNTERMINATED_CONDITION; } conditional_depth = contextStack.curr().conditional_ctx-1; contextStack.pop(); return STATUS_OK; } // // // MACROS // // // add a custom macro StatusCode Asm::AddMacro(strref macro, strref source_name, strref source_file, strref &left) { // // Recommended macro syntax: // macro name(optional params) { actual macro } // // -endm option macro syntax: // macro name arg // actual macro // endmacro // // Merlin macro syntax: (TODO: ignore arguments and use ]1, ]2, etc.) // name mac arg1 arg2 // actual macro // [<<<]/[EOM] // strref name; bool params_first_line = false; if (Merlin()) { if (Label *pLastLabel = GetLabel(last_label)) { labels.remove((uint32_t)(pLastLabel - labels.getValues())); name = last_label; last_label.clear(); macro.skip_whitespace(); if (macro.get_first()==';'||macro.has_prefix(c_comment)) { macro.line(); } else { params_first_line = true; } } else { return ERROR_BAD_MACRO_FORMAT; } } else { name = macro.split_range(label_end_char_range); macro.skip_whitespace(); strref left_line = macro.get_line(); left_line.skip_whitespace(); left_line = left_line.before_or_full(';').before_or_full(c_comment); if (left_line && left_line[0]!='(' && left_line[0]!='{') { params_first_line = true; } } uint32_t hash = name.fnv1a(); uint32_t ins = FindLabelIndex(hash, macros.getKeys(), macros.count()); Macro *pMacro = nullptr; while (ins < macros.count() && macros.getKey(ins)==hash) { if (name.same_str_case(macros.getValue(ins).name)) { pMacro = macros.getValues() + ins; break; } ++ins; } if (!pMacro) { macros.insert(ins, hash); pMacro = macros.getValues() + ins; } pMacro->name = name; if (Merlin()) { strref source = macro; while (strref next_line = macro.line()) { next_line = next_line.before_or_full(';'); next_line = next_line.before_or_full(c_comment); int term = next_line.find("<<<"); if (term<0) { term = next_line.find("EOM"); } if (term >= 0) { strl_t macro_len = strl_t(next_line.get() + term - source.get()); source = source.get_substr(0, macro_len); break; } } left = macro; pMacro->macro = source; source.skip_whitespace(); } else if (end_macro_directive) { int f = -1; const strref endm("endm"); for (;;) { f = macro.find(endm, f+1); if (f<0) { return ERROR_BAD_MACRO_FORMAT; } if (f==0||strref::is_ws(macro[f-1])) { break; } } pMacro->macro = macro.get_substr(0, f); macro += f; macro.line(); left = macro; } else { int pos_bracket = macro.find('{'); if (pos_bracket < 0) { pMacro->macro = strref(); return ERROR_BAD_MACRO_FORMAT; } strref source = macro + pos_bracket; strref macro_body = source.scoped_block_skip(); pMacro->macro = strref(macro.get(), pos_bracket + macro_body.get_len() + 2); source.skip_whitespace(); left = source; } pMacro->source_name = source_name; pMacro->source_file = source_file; pMacro->params_first_line = params_first_line; return STATUS_OK; } // Compile in a macro StatusCode Asm::BuildMacro(Macro &m, strref arg_list) { strref macro_src = m.macro, params; if (m.params_first_line) { if (end_macro_directive||Merlin()) { params = macro_src.line(); } else { params = macro_src.before('{'); macro_src += params.get_len(); } } else { params = (macro_src[0]=='(' ? macro_src.scoped_block_skip() : strref()); } params.trim_whitespace(); arg_list.trim_whitespace(); if (Merlin()) { // need to include comment field because separator is ; if (contextStack.curr().read_source.is_substr(arg_list.get())) arg_list = (contextStack.curr().read_source + strl_t(arg_list.get()-contextStack.curr().read_source.get()) ).line(); arg_list = arg_list.before_or_full(c_comment).get_trimmed_ws(); strref arg = arg_list; strown<16> tag; int t_max = 16; int dSize = 0; for (int t=1; t 0) { for (int skip = 1; skip < t; skip++) args.split_token_trim(';'); strref a = args.split_token_trim(';'); macexp.exchange(offs, tag_mac.get_len(), a); pos += a.get_len(); success = true; } } if (!success) { return ERROR_MACRO_ARGUMENT; } } } PushContext(m.source_name, macexp.get_strref(), macexp.get_strref()); return STATUS_OK; } else { return ERROR_OUT_OF_MEMORY_FOR_MACRO_EXPANSION; } } else if (params) { if (arg_list[0]=='(') arg_list = arg_list.scoped_block_skip(); strref pchk = params; strref arg = arg_list; int dSize = 0; char token = arg_list.find(',')>=0 ? ',' : ' '; char token_macro = m.params_first_line && params.find(',') < 0 ? ' ' : ','; while (strref param = pchk.split_token_trim(token_macro)) { strref a = arg.split_token_trim(token); if (param.get_len() < a.get_len()) { int count = macro_src.substr_case_count(param); dSize += count * ((int)a.get_len() - (int)param.get_len()); } } int mac_size = (int)macro_src.get_len() + dSize + 32; if (char *buffer = (char*)malloc(mac_size)) { loadedData.push_back(buffer); strovl macexp(buffer, mac_size); macexp.copy(macro_src); while (strref param = params.split_token_trim(token_macro)) { strref a = arg_list.split_token_trim(token); macexp.replace_bookend(param, a, label_end_char_range); } PushContext(m.source_name, macexp.get_strref(), macexp.get_strref()); return STATUS_OK; } else { return ERROR_OUT_OF_MEMORY_FOR_MACRO_EXPANSION; } } PushContext(m.source_name, m.source_file, macro_src); return STATUS_OK; } // // // STRUCTS AND ENUMS // // // Enums are Structs in disguise StatusCode Asm::BuildEnum(strref name, strref declaration) { uint32_t hash = name.fnv1a(); uint32_t ins = FindLabelIndex(hash, labelStructs.getKeys(), labelStructs.count()); LabelStruct *pEnum = nullptr; while (ins < labelStructs.count() && labelStructs.getKey(ins)==hash) { if (name.same_str_case(labelStructs.getValue(ins).name)) { pEnum = labelStructs.getValues() + ins; break; } ++ins; } if (pEnum) { return ERROR_STRUCT_ALREADY_DEFINED; } labelStructs.insert(ins, hash); pEnum = labelStructs.getValues() + ins; pEnum->name = name; pEnum->first_member = (uint16_t)structMembers.size(); pEnum->numMembers = 0; pEnum->size = 0; // enums are 0 sized int value = 0; struct EvalContext etx; SetEvalCtxDefaults(etx); while (strref line = declaration.line()) { line = line.before_or_full(','); line.trim_whitespace(); strref member_name = line.split_token_trim('='); line = line.before_or_full(';').before_or_full(c_comment).get_trimmed_ws(); if (line) { StatusCode error = EvalExpression(line, etx, value); if (error==STATUS_NOT_READY||error==STATUS_XREF_DEPENDENT) { return ERROR_ENUM_CANT_BE_ASSEMBLED; } else if (error!=STATUS_OK) { return error; } } struct MemberOffset member; member.offset = (uint16_t)value; member.name = member_name; member.name_hash = member.name.fnv1a(); member.sub_struct = strref(); structMembers.push_back(member); ++value; pEnum->numMembers++; } return STATUS_OK; } StatusCode Asm::BuildStruct(strref name, strref declaration) { uint32_t hash = name.fnv1a(); uint32_t ins = FindLabelIndex(hash, labelStructs.getKeys(), labelStructs.count()); LabelStruct *pStruct = nullptr; while (ins < labelStructs.count() && labelStructs.getKey(ins)==hash) { if (name.same_str_case(labelStructs.getValue(ins).name)) { pStruct = labelStructs.getValues() + ins; break; } ++ins; } if (pStruct) { return ERROR_STRUCT_ALREADY_DEFINED; } labelStructs.insert(ins, hash); pStruct = labelStructs.getValues() + ins; pStruct->name = name; pStruct->first_member = (uint16_t)structMembers.size(); uint32_t byte_hash = struct_byte.fnv1a(); uint32_t word_hash = struct_word.fnv1a(); uint16_t size = 0; uint16_t member_count = 0; while (strref line = declaration.line()) { line.trim_whitespace(); strref type = line.split_label(); if (!type) { continue; } line.skip_whitespace(); uint32_t type_hash = type.fnv1a(); uint16_t type_size = 0; LabelStruct *pSubStruct = nullptr; if (type_hash==byte_hash && struct_byte.same_str_case(type)) { type_size = 1; } else if (type_hash==word_hash && struct_word.same_str_case(type)) { type_size = 2; } else { uint32_t index = FindLabelIndex(type_hash, labelStructs.getKeys(), labelStructs.count()); while (index < labelStructs.count() && labelStructs.getKey(index)==type_hash) { if (type.same_str_case(labelStructs.getValue(index).name)) { pSubStruct = labelStructs.getValues() + index; break; } ++index; } if (!pSubStruct) { labelStructs.remove(ins); return ERROR_REFERENCED_STRUCT_NOT_FOUND; } type_size = pSubStruct->size; } // add the new member, don't grow vectors one at a time. if (structMembers.size()==structMembers.capacity()) { structMembers.reserve(structMembers.size()+64); } struct MemberOffset member; member.offset = size; member.name = line.get_label(); member.name_hash = member.name.fnv1a(); member.sub_struct = pSubStruct ? pSubStruct->name : strref(); structMembers.push_back(member); size += type_size; member_count++; } { // add a trailing member of 0 bytes to access the size of the structure struct MemberOffset bytes_member; bytes_member.offset = size; bytes_member.name = "bytes"; bytes_member.name_hash = bytes_member.name.fnv1a(); bytes_member.sub_struct = strref(); structMembers.push_back(bytes_member); member_count++; } pStruct->numMembers = member_count; pStruct->size = size; return STATUS_OK; } // Evaluate a struct offset as if it was a label StatusCode Asm::EvalStruct(strref name, int &value) { LabelStruct *pStruct = nullptr; uint16_t offset = 0; while (strref struct_seg = name.split_token('.')) { strref sub_struct = struct_seg; uint32_t seg_hash = struct_seg.fnv1a(); if (pStruct) { struct MemberOffset *member = &structMembers[pStruct->first_member]; bool found = false; for (int i = 0; inumMembers; i++) { if (member->name_hash == seg_hash && member->name.same_str_case(struct_seg)) { offset += member->offset; sub_struct = member->sub_struct; found = true; break; } ++member; } if (!found) { return ERROR_REFERENCED_STRUCT_NOT_FOUND; } } if (sub_struct) { uint32_t hash = sub_struct.fnv1a(); uint32_t index = FindLabelIndex(hash, labelStructs.getKeys(), labelStructs.count()); while (index < labelStructs.count() && labelStructs.getKey(index)==hash) { if (sub_struct.same_str_case(labelStructs.getValue(index).name)) { pStruct = labelStructs.getValues() + index; break; } ++index; } } else if (name) { return STATUS_NOT_STRUCT; } } if (pStruct==nullptr) { return STATUS_NOT_STRUCT; } value = offset; return STATUS_OK; } // // // EXPRESSIONS AND LATE EVALUATION // // int Asm::ReptCnt() const { return contextStack.curr().repeat_total - contextStack.curr().repeat; } void Asm::SetEvalCtxDefaults(struct EvalContext &etx) { etx.pc = CurrSection().GetPC(); // current address at point of eval etx.scope_pc = scope_address[scope_depth]; // current scope open at point of eval etx.scope_end_pc = -1; // late scope closure after eval etx.scope_depth = scope_depth; // scope depth for eval (must match current for scope_end_pc to eval) etx.relative_section = -1; // return can be relative to this section etx.file_ref = -1; // can access private label from this file or -1 etx.rept_cnt = ReptCnt(); // current repeat counter } // Get a single token from a merlin expression EvalOperator Asm::RPNToken_Merlin(strref &expression, const struct EvalContext &etx, EvalOperator prev_op, int16_t §ion, int &value) { char c = expression.get_first(); switch (c) { case '$': ++expression; value = (int)expression.ahextoui_skip(); return EVOP_VAL; case '-': ++expression; return EVOP_SUB; case '+': ++expression; return EVOP_ADD; case '*': // asterisk means both multiply and current PC, disambiguate! ++expression; if (expression[0]=='*') return EVOP_STP; // double asterisks indicates comment else if (prev_op==EVOP_VAL||prev_op==EVOP_RPR) return EVOP_MUL; value = etx.pc; section = int16_t(CurrSection().IsRelativeSection() ? SectionId() : -1); return EVOP_VAL; case '/': ++expression; return EVOP_DIV; case '>': if (expression.get_len()>=2&&expression[1]=='>') { expression += 2; return EVOP_SHR; } ++expression; return EVOP_HIB; case '<': if (expression.get_len()>=2&&expression[1]=='<') { expression += 2; return EVOP_SHL; } ++expression; return EVOP_LOB; case '%': // % means both binary and scope closure, disambiguate! if (expression[1]=='0'||expression[1]=='1') { ++expression; value = (int)expression.abinarytoui_skip(); return EVOP_VAL; } if (etx.scope_end_pc<0||scope_depth!=etx.scope_depth) return EVOP_NRY; ++expression; value = etx.scope_end_pc; section = int16_t(CurrSection().IsRelativeSection() ? SectionId() : -1); return EVOP_VAL; case '|': case '.': ++expression; return EVOP_OR; // MERLIN: . is or, | is not used case '^': if (prev_op==EVOP_VAL||prev_op==EVOP_RPR) { ++expression; return EVOP_EOR; } ++expression; return EVOP_BAB; case '&': ++expression; return EVOP_AND; case '(': if (prev_op!=EVOP_VAL) { ++expression; return EVOP_LPR; } return EVOP_STP; case ')': ++expression; return EVOP_RPR; case '"': if (expression[2]=='"') { value = expression[1]; expression += 3; return EVOP_VAL; } return EVOP_STP; case '\'': if (expression[2]=='\'') { value = expression[1]; expression += 3; return EVOP_VAL; } return EVOP_STP; case ',': case '?': return EVOP_STP; } if (c == '!' && (prev_op == EVOP_VAL || prev_op == EVOP_RPR)) { ++expression; return EVOP_EOR; } else if (c == '!' && !(expression + 1).len_label()) { if (etx.scope_pc < 0) return EVOP_NRY; // ! by itself is current scope, !+label char is a local label ++expression; value = etx.scope_pc; section = int16_t(CurrSection().IsRelativeSection() ? SectionId() : -1); return EVOP_VAL; } else if (expression.match_chars_str("0-9", "!a-zA-Z_")) { if (prev_op == EVOP_VAL) return EVOP_STP; // value followed by value doesn't make sense, stop value = expression.atoi_skip(); return EVOP_VAL; } else if (c == '!' || c == ']' || c==':' || strref::is_valid_label(c)) { if (prev_op == EVOP_VAL) return EVOP_STP; // a value followed by a value does not make sense, probably start of a comment (ORCA/LISA?) char e0 = expression[0]; int start_pos = (e0==']' || e0==':' || e0=='!' || e0=='.') ? 1 : 0; strref label = expression.split_range_trim(label_end_char_range_merlin, start_pos); Label *pLabel = pLabel = GetLabel(label, etx.file_ref); if (!pLabel) { StatusCode ret = EvalStruct(label, value); if (ret==STATUS_OK) { return EVOP_VAL; } if (ret!=STATUS_NOT_STRUCT) { return EVOP_ERR; } // partial struct } if (!pLabel && label.same_str("rept")) { value = etx.rept_cnt; return EVOP_VAL; } if (!pLabel||!pLabel->evaluated) { return EVOP_NRY; } // this label could not be found (yet) value = pLabel->value; section = int16_t(pLabel->section); return EVOP_VAL; } return EVOP_ERR; } // Get a single token from most non-apple II assemblers EvalOperator Asm::RPNToken(strref &exp, const struct EvalContext &etx, EvalOperator prev_op, int16_t §ion, int &value, strref &subexp) { char c = exp.get_first(); switch (c) { case '$': ++exp; value = (int)exp.ahextoui_skip(); return EVOP_VAL; case '-': ++exp; return EVOP_SUB; case '+': ++exp; return EVOP_ADD; case '*': // asterisk means both multiply and current PC, disambiguate! ++exp; if (exp[0] == '*') return EVOP_STP; // double asterisks indicates comment else if (prev_op == EVOP_VAL || prev_op == EVOP_RPR) return EVOP_MUL; value = etx.pc; section = int16_t(CurrSection().IsRelativeSection() ? SectionId() : -1); return EVOP_VAL; case '/': ++exp; return EVOP_DIV; case '=': if (exp[1] == '=') { exp += 2; return EVOP_EQU; } return EVOP_STP; case '>': if (exp.get_len() >= 2 && exp[1] == '>') { exp += 2; return EVOP_SHR; } if (prev_op == EVOP_VAL || prev_op == EVOP_RPR) { ++exp; if (exp[0] == '=') { ++exp; return EVOP_GTE; } return EVOP_GT; } ++exp; return EVOP_HIB; case '<': if (exp.get_len() >= 2 && exp[1] == '<') { exp += 2; return EVOP_SHL; } if (prev_op == EVOP_VAL || prev_op == EVOP_RPR) { ++exp; if (exp[0] == '=') { ++exp; return EVOP_LTE; } return EVOP_LT; } ++exp; return EVOP_LOB; case '%': // % means both binary and scope closure, disambiguate! if (exp[1] == '0' || exp[1] == '1') { ++exp; value = (int)exp.abinarytoui_skip(); return EVOP_VAL; } if (etx.scope_end_pc<0 || scope_depth != etx.scope_depth) return EVOP_NRY; ++exp; value = etx.scope_end_pc; section = int16_t(CurrSection().IsRelativeSection() ? SectionId() : -1); return EVOP_VAL; case '|': ++exp; return EVOP_OR; case '^': if (prev_op == EVOP_VAL || prev_op == EVOP_RPR) { ++exp; return EVOP_EOR; } ++exp; return EVOP_BAB; case '&': ++exp; return EVOP_AND; case '(': if (prev_op != EVOP_VAL) { ++exp; return EVOP_LPR; } return EVOP_STP; case ')': ++exp; return EVOP_RPR; case ',': case '?': case '\'': return EVOP_STP; } // ! by itself is current scope, !+label char is a local label if (c == '!' && !(exp + 1).len_label()) { if (etx.scope_pc < 0) return EVOP_NRY; ++exp; value = etx.scope_pc; section = int16_t(CurrSection().IsRelativeSection() ? SectionId() : -1); return EVOP_VAL; } else if (exp.match_chars_str("0-9", "!a-zA-Z_")) { if (prev_op == EVOP_VAL) return EVOP_STP; // value followed by value doesn't make sense, stop value = exp.atoi_skip(); return EVOP_VAL; } else if (c == '!' || c == ':' || c=='.' || c=='@' || strref::is_valid_label(c)) { if (prev_op == EVOP_VAL) return EVOP_STP; // a value followed by a value does not make sense, probably start of a comment (ORCA/LISA?) char e0 = exp[0]; int start_pos = (e0 == ':' || e0 == '!' || e0 == '.') ? 1 : 0; strref label = exp.split_range_trim(label_end_char_range, start_pos); Label *pLabel = pLabel = GetLabel(label, etx.file_ref); if (!pLabel) { StatusCode ret = EvalStruct(label, value); if (ret==STATUS_OK) { return EVOP_VAL; } if (ret!=STATUS_NOT_STRUCT) { return EVOP_ERR; } // partial struct } if (!pLabel && label.same_str("rept")) { value = etx.rept_cnt; return EVOP_VAL; } if (!pLabel) { if (StringSymbol *pStr = GetString(label)) { subexp = pStr->get(); return EVOP_EXP; } } if (!pLabel || !pLabel->evaluated) return EVOP_NRY; // this label could not be found (yet) value = pLabel->value; section = int16_t(pLabel->section); return pLabel->reference ? EVOP_XRF : EVOP_VAL; } return EVOP_ERR; } // // EvalExpression // Uses the Shunting Yard algorithm to convert to RPN first // which makes the actual calculation trivial and avoids recursion. // https://en.wikipedia.org/wiki/Shunting-yard_algorithm // // Return: // STATUS_OK means value is completely evaluated // STATUS_NOT_READY means value could not be evaluated right now // ERROR_* means there is an error in the expression // // Max number of unresolved sections to evaluate in a single expression #define MAX_EVAL_SECTIONS 4 // determine if a scalar can be a shift static int mul_as_shift(int scalar) { int shift = 0; while (scalar > 1 && (scalar & 1) == 0) { shift++; scalar >>= 1; } return scalar == 1 ? shift : 0; } #define MAX_EXPR_STACK 2 StatusCode Asm::EvalExpression(strref expression, const struct EvalContext &etx, int &result) { int numValues = 0; int numOps = 0; strref expression_stack[MAX_EXPR_STACK]; int exp_sp = 0; char ops[MAX_EVAL_OPER]; // RPN expression int values[MAX_EVAL_VALUES]; // RPN values (in order of RPN EVOP_VAL operations) int16_t section_ids[MAX_EVAL_SECTIONS]; // local index of each referenced section int16_t section_val[MAX_EVAL_VALUES] = { 0 }; // each value can be assigned to one section, or -1 if fixed int16_t num_sections = 0; // number of sections in section_ids (normally 0 or 1, can be up to MAX_EVAL_SECTIONS) bool xrefd = false; values[0] = 0; // Initialize RPN if no expression { int sp = 0; char op_stack[MAX_EVAL_OPER]; EvalOperator prev_op = EVOP_NONE; expression.trim_whitespace(); while (expression || exp_sp) { int value = 0; int16_t section = -1, index_section = -1; EvalOperator op = EVOP_NONE; strref subexp; if (!expression && exp_sp) { expression = expression_stack[--exp_sp]; op = EVOP_RPR; } else if (Merlin()) { op = RPNToken_Merlin(expression, etx, prev_op, section, value); } else { op = RPNToken(expression, etx, prev_op, section, value, subexp); } if (op==EVOP_ERR) { return ERROR_UNEXPECTED_CHARACTER_IN_EXPRESSION; } else if (op==EVOP_NRY) { return STATUS_NOT_READY; } else if (op == EVOP_EXP) { if (exp_sp>=MAX_EXPR_STACK) { return ERROR_TOO_MANY_VALUES_IN_EXPRESSION; } expression_stack[exp_sp++] = expression; expression = subexp; op = EVOP_LPR; } else if (op == EVOP_XRF) { xrefd = true; op = EVOP_VAL; } if (section >= 0) { for (int s = 0; s= EVOP_EQU && prev_op <= EVOP_GTE) || (prev_op==EVOP_HIB || prev_op==EVOP_LOB)) { if (op==EVOP_SUB) { op = EVOP_NEG; } else if (op==EVOP_ADD) { skip = true; } } if (op==EVOP_SUB && sp && prev_op==EVOP_SUB) { sp--; } else { while (sp && !skip) { EvalOperator p = (EvalOperator)op_stack[sp-1]; if (p==EVOP_LPR||op>p) { break; } ops[numOps++] = (char)p; sp--; } op_stack[sp++] = (char)op; } } // check for out of bounds or unexpected input if (numValues==MAX_EVAL_VALUES) { return ERROR_TOO_MANY_VALUES_IN_EXPRESSION; } else if (numOps==MAX_EVAL_OPER||sp==MAX_EVAL_OPER) { return ERROR_TOO_MANY_OPERATORS_IN_EXPRESSION; } prev_op = op; expression.skip_whitespace(); } while (sp) { sp--; ops[numOps++] = op_stack[sp]; } } // Check if dependent on XREF'd symbol if (xrefd) { return STATUS_XREF_DEPENDENT; } // processing the result RPN will put the completed expression into values[0]. // values is used as both the queue and the stack of values since reads/writes won't // exceed itself. { int valIdx = 0; int ri = 0; // RPN index (value) int prev_val = values[0]; int shift_bits = 0; // special case for relative reference to low byte / high byte int16_t section_counts[MAX_EVAL_SECTIONS][MAX_EVAL_VALUES] = { 0 }; for (int o = 0; o ri--; values[ri - 1] = values[ri - 1] > values[ri]; break; case EVOP_LT: // < ri--; values[ri - 1] = values[ri - 1] < values[ri]; break; case EVOP_GTE: // >= ri--; values[ri - 1] = values[ri - 1] >= values[ri]; break; case EVOP_LTE: // >= ri--; values[ri - 1] = values[ri - 1] <= values[ri]; break; case EVOP_ADD: // + ri--; for (int i = 0; i1) { ri--; for (int i = 0; i=1) { values[ri-1] = -values[ri-1]; } break; case EVOP_MUL: // * ri--; for (int i = 0; i> ri--; for (int i = 0; i>= values[ri]; break; case EVOP_LOB: // low byte if (ri) { values[ri-1] &= 0xff; } break; case EVOP_HIB: if (ri) { shift_bits = -8; values[ri - 1] = values[ri - 1] >> 8; } break; case EVOP_BAB: if (ri) { shift_bits = -16; values[ri - 1] = (values[ri - 1] >> 16); } break; default: return ERROR_EXPRESSION_OPERATION; break; } if (shift_bits==0&&ri) { prev_val = values[ri-1]; } } int section_index = -1; bool curr_relative = false; // If relative to any section unless specifically interested in a relative value then return not ready for (int i = 0; i=0) { return STATUS_NOT_READY; } else if (etx.relative_section==section_ids[i]) { curr_relative = true; } else if (etx.relative_section>=0) { return STATUS_NOT_READY; } section_index = i; } } result = values[0]; if (section_index>=0 && !curr_relative) { lastEvalSection = section_ids[section_index]; lastEvalValue = prev_val; lastEvalShift = (int8_t)shift_bits; return STATUS_RELATIVE_SECTION; } } return STATUS_OK; } // if an expression could not be evaluated, add it along with // the action to perform if it can be evaluated later. void Asm::AddLateEval(int target, int pc, int scope_pc, strref expression, strref source_file, LateEval::Type type) { LateEval le; le.address = pc; le.scope = scope_pc; le.scope_depth = scope_depth; le.target = target; le.section = (int16_t)(&CurrSection() - &allSections[0]); le.rept = contextStack.curr().repeat_total - contextStack.curr().repeat; le.file_ref = -1; // current or xdef'd le.label.clear(); le.expression = expression; le.source_file = source_file; le.type = type; lateEval.push_back(le); } void Asm::AddLateEval(strref label, int pc, int scope_pc, strref expression, LateEval::Type type) { LateEval le; le.address = pc; le.scope = scope_pc; le.scope_depth = scope_depth; le.target = -1; le.label = label; le.section = (int16_t)(&CurrSection() - &allSections[0]); le.rept = contextStack.curr().repeat_total - contextStack.curr().repeat; le.file_ref = -1; // current or xdef'd le.expression = expression; le.source_file.clear(); le.type = type; lateEval.push_back(le); } // When a label is defined or a scope ends check if there are // any related late label evaluators that can now be evaluated. StatusCode Asm::CheckLateEval(strref added_label, int scope_end, bool print_missing_reference_errors) { bool evaluated_label = true; strref new_labels[MAX_LABELS_EVAL_ALL]; int num_new_labels = 0; if (added_label) { new_labels[num_new_labels++] = added_label; } bool all = !added_label; while (evaluated_label) { evaluated_label = false; std::vector::iterator i = lateEval.begin(); while (i != lateEval.end()) { int value = 0; // check if this expression is related to the late change (new label or end of scope) bool check = all || num_new_labels==MAX_LABELS_EVAL_ALL; for (int l = 0; lexpression.find(new_labels[l]) >= 0; if (!check && scope_end>0) { int gt_pos = 0; while (gt_pos>=0 && !check) { gt_pos = i->expression.find_at('%', gt_pos); if (gt_pos>=0) { if (i->expression[gt_pos+1]=='%') { gt_pos++; } else { check = true; } gt_pos++; } } } if (check) { struct EvalContext etx(i->address, i->scope, scope_end, i->type == LateEval::LET_BRANCH ? SectionId() : -1, i->rept); etx.scope_depth = i->scope_depth; etx.file_ref = i->file_ref; StatusCode ret = EvalExpression(i->expression, etx, value); if (ret == STATUS_OK || ret==STATUS_RELATIVE_SECTION) { // Check if target section merged with another section int trg = i->target; int sec = i->section; if (i->type != LateEval::LET_LABEL) { if (allSections[sec].IsMergedSection()) { trg += allSections[sec].merged_offset; sec = allSections[sec].merged_section; } } bool resolved = true; switch (i->type) { case LateEval::LET_BYTE: if (ret==STATUS_RELATIVE_SECTION) { if (i->section<0) { resolved = false; } else { allSections[sec].AddReloc(lastEvalValue, trg, lastEvalSection, 1, lastEvalShift); value = 0; } } if (trg>=allSections[sec].size()) { return ERROR_SECTION_TARGET_OFFSET_OUT_OF_RANGE; } allSections[sec].SetByte(trg, value); break; case LateEval::LET_ABS_REF: if (ret==STATUS_RELATIVE_SECTION) { if (i->section<0) { resolved = false; } else { allSections[sec].AddReloc(lastEvalValue, trg, lastEvalSection, 2, lastEvalShift); value = 0; } } if ((trg+1)>=allSections[sec].size()) { return ERROR_SECTION_TARGET_OFFSET_OUT_OF_RANGE; } allSections[sec].SetWord(trg, value); break; case LateEval::LET_ABS_L_REF: if (ret==STATUS_RELATIVE_SECTION) { if (i->section<0) { resolved = false; } else { allSections[sec].AddReloc(lastEvalValue, trg, lastEvalSection, 3, lastEvalShift); value = 0; } } if ((trg+2)>=allSections[sec].size()) { return ERROR_SECTION_TARGET_OFFSET_OUT_OF_RANGE; } allSections[sec].SetTriple(trg, value); break; case LateEval::LET_ABS_4_REF: if (ret==STATUS_RELATIVE_SECTION) { if (i->section<0) { resolved = false; } else { allSections[sec].AddReloc(lastEvalValue, trg, lastEvalSection, 4, lastEvalShift); value = 0; } } if ((trg+3)>=allSections[sec].size()) { return ERROR_SECTION_TARGET_OFFSET_OUT_OF_RANGE; } allSections[sec].SetQuad(trg, value); break; case LateEval::LET_BRANCH: value -= i->address+1; if (value<-128 || value>127) { i = lateEval.erase(i); return ERROR_BRANCH_OUT_OF_RANGE; } if (trg>=allSections[sec].size()) { return ERROR_SECTION_TARGET_OFFSET_OUT_OF_RANGE; } allSections[sec].SetByte(trg, value); break; case LateEval::LET_BRANCH_16: value -= i->address+2; if (trg>=allSections[sec].size()) { return ERROR_SECTION_TARGET_OFFSET_OUT_OF_RANGE; } allSections[sec].SetWord(trg, value); break; case LateEval::LET_LABEL: { Label *label = GetLabel(i->label, i->file_ref); if (!label) { return ERROR_LABEL_MISPLACED_INTERNAL; } label->value = value; label->evaluated = true; label->section = ret==STATUS_RELATIVE_SECTION ? i->section : -1; if (num_new_labelslabel_name; } evaluated_label = true; char f = i->label[0], l = i->label.get_last(); LabelAdded(label, f=='.' || f=='!' || f=='@' || f==':' || l=='$'); break; } default: break; } if (resolved) { i = lateEval.erase(i); } } else { if (print_missing_reference_errors && ret!=STATUS_XREF_DEPENDENT) { PrintError(i->expression, ret); error_encountered = true; } ++i; } } else { ++i; } } all = false; added_label.clear(); } return STATUS_OK; } // // // LABELS // // // Get a label record if it exists Label *Asm::GetLabel(strref label) { uint32_t label_hash = label.fnv1a(); uint32_t index = FindLabelIndex(label_hash, labels.getKeys(), labels.count()); while (index < labels.count() && label_hash == labels.getKey(index)) { if (label.same_str(labels.getValue(index).label_name)) { return labels.getValues()+index; } index++; } return nullptr; } // Get a protected label record from a file if it exists Label *Asm::GetLabel(strref label, int file_ref) { if (file_ref>=0 && file_ref<(int)externals.size()) { ExtLabels &labs = externals[file_ref]; uint32_t label_hash = label.fnv1a(); uint32_t index = FindLabelIndex(label_hash, labs.labels.getKeys(), labs.labels.count()); while (index < labs.labels.count() && label_hash == labs.labels.getKey(index)) { if (label.same_str(labs.labels.getValue(index).label_name)) { return labs.labels.getValues()+index; } index++; } } return GetLabel(label); } // If exporting labels, append this label to the list void Asm::LabelAdded(Label *pLabel, bool local) { if (pLabel && pLabel->evaluated) { if (map.size()==map.capacity()) { map.reserve(map.size()+256); } MapSymbol sym; sym.name = pLabel->label_name; sym.section = (int16_t)(pLabel->section); sym.value = pLabel->value; sym.local = local; pLabel->mapIndex = pLabel->evaluated ? -1 : (int)map.size(); map.push_back(sym); } } // Add a label entry Label* Asm::AddLabel(uint32_t hash) { uint32_t index = FindLabelIndex(hash, labels.getKeys(), labels.count()); labels.insert(index, hash); return labels.getValues() + index; } // mark a label as a local label void Asm::MarkLabelLocal(strref label, bool scope_reserve) { LocalLabelRecord rec; rec.label = label; rec.scope_depth = scope_depth; rec.scope_reserve = scope_reserve; localLabels.push_back(rec); } // find all local labels or up to given scope level and remove them StatusCode Asm::FlushLocalLabels(int scope_exit) { StatusCode status = STATUS_OK; // iterate from end of local label records and early out if the label scope is lower than the current. std::vector::iterator i = localLabels.end(); while (i!=localLabels.begin()) { --i; if (i->scope_depthlabel; StatusCode this_status = CheckLateEval(label); if (this_status>FIRST_ERROR) { status = this_status; } if (!i->scope_reserve || i->scope_depth<=scope_exit) { uint32_t index = FindLabelIndex(label.fnv1a(), labels.getKeys(), labels.count()); while (index>4; if (ranges>2||num32>((MAX_POOL_BYTES+15)>>4)) { return ERROR_POOL_RANGE_EXPRESSION_EVAL; } } if (!ranges) { return ERROR_POOL_RANGE_EXPRESSION_EVAL; } LabelPool pool; pool.pool_name = name; pool.numRanges = (int16_t)(ranges>>1); pool.depth = 0; pool.start = aRng[0]; pool.end = aRng[1]; labelPools.insert(ins, pool_hash); LabelPool &poolValue = labelPools.getValue(ins); poolValue = pool; return STATUS_OK; } StatusCode Asm::AssignPoolLabel(LabelPool &pool, strref label) { if (pool_subpool.is_prefix_word(label)) { // declaring a pool within another pool? label += pool_subpool.get_len(); label.skip_whitespace(); strref size = label; label = size.split_label(); if (strref::is_number(size.get_first())) { uint16_t bytes = (uint16_t)size.atoi(); if (!bytes) { return ERROR_POOL_RANGE_EXPRESSION_EVAL; } if (!GetLabelPool(label)) { uint16_t addr; StatusCode error = pool.Reserve(bytes, addr, (uint16_t)brace_depth); if( error == STATUS_OK ) { // permanently remove this chunk from the parent pool pool.end = addr; pool.depth = 0; uint32_t pool_hash = label.fnv1a(); uint32_t ins = FindLabelIndex(pool_hash, labelPools.getKeys(), labelPools.count()); labelPools.insert(ins, pool_hash); LabelPool &subPool = labelPools.getValue(ins); subPool.pool_name = label; subPool.numRanges = 1; subPool.depth = 0; subPool.start = addr; subPool.end = addr+bytes; } return error; } else { return ERROR_LABEL_POOL_REDECLARATION; } } return ERROR_POOL_RANGE_EXPRESSION_EVAL; } strref type = label; uint16_t bytes = 1; int sz = label.find_at( '.', 1 ); if (sz > 0) { label = type.split( sz ); ++type; if (strref::is_number(type.get_first())) { bytes = (uint16_t)type.atoi(); } else { switch (strref::tolower(type.get_first())) { case 'l': bytes = 4; break; case 't': bytes = 3; break; case 'd': case 'w': bytes = 2; break; } } } if (GetLabel(label)) { return ERROR_POOL_LABEL_ALREADY_DEFINED; } uint16_t addr; StatusCode error = pool.Reserve(bytes, addr, (uint16_t)brace_depth); if (error!=STATUS_OK) { return error; } Label *pLabel = AddLabel(label.fnv1a()); pLabel->label_name = label; pLabel->pool_name = pool.pool_name; pLabel->evaluated = true; pLabel->section = -1; // pool labels are section-less pLabel->value = addr; pLabel->pc_relative = true; pLabel->constant = true; pLabel->external = false; pLabel->reference = false; bool local = false; if (label[ 0 ] == '.' || label[ 0 ] == '@' || label[ 0 ] == '!' || label[ 0 ] == ':' || label.get_last() == '$') { local = true; MarkLabelLocal( label, true ); } LabelAdded(pLabel, local); return error; } // Request a label from a pool StatusCode LabelPool::Reserve(uint16_t numBytes, uint16_t &ret_addr, uint16_t scope) { if (numBytes>(end-start)||depth==MAX_SCOPE_DEPTH) { return ERROR_OUT_OF_LABELS_IN_POOL; } if (!depth||scope!=scopeUsed[depth-1][1]) { scopeUsed[depth][0] = end; scopeUsed[depth][1] = scope; ++depth; } end -= numBytes; ret_addr = end; return STATUS_OK; } // Release a label from a pool (at scope closure) void LabelPool::ExitScope(uint16_t scope) { if (depth && scopeUsed[depth-1][1]==scope) { end = scopeUsed[--depth][0]; } } // Check if a label is marked as an xdef bool Asm::MatchXDEF(strref label) { uint32_t hash = label.fnv1a(); uint32_t pos = FindLabelIndex(hash, xdefs.getKeys(), xdefs.count()); while (pos < xdefs.count() && xdefs.getKey(pos) == hash) { if (label.same_str_case(xdefs.getValue(pos))) { return true; } ++pos; } return false; } // assignment of label ( = ) StatusCode Asm::AssignLabel(strref label, strref line, bool make_constant) { line.trim_whitespace(); int val = 0; struct EvalContext etx; SetEvalCtxDefaults(etx); StatusCode status = EvalExpression(line, etx, val); if (status!=STATUS_NOT_READY && status!=STATUS_OK && status!=STATUS_RELATIVE_SECTION) { return status; } Label *pLabel = GetLabel(label); if (pLabel) { if (pLabel->constant && pLabel->evaluated && val!=pLabel->value) { return (status==STATUS_NOT_READY) ? STATUS_OK : ERROR_MODIFYING_CONST_LABEL; } } else { pLabel = AddLabel(label.fnv1a()); } pLabel->label_name = label; pLabel->pool_name.clear(); pLabel->evaluated = status==STATUS_OK || status == STATUS_RELATIVE_SECTION; pLabel->section = status == STATUS_RELATIVE_SECTION ? lastEvalSection : -1; // assigned labels are section-less pLabel->value = val; pLabel->mapIndex = -1; pLabel->pc_relative = false; pLabel->constant = make_constant; pLabel->external = MatchXDEF(label); pLabel->reference = false; bool local = label[0]=='.' || label[0]=='@' || label[0]=='!' || label[0]==':' || label.get_last()=='$'; if (!pLabel->evaluated) { AddLateEval(label, CurrSection().GetPC(), scope_address[scope_depth], line, LateEval::LET_LABEL); } else { if (local) { MarkLabelLocal(label); } LabelAdded(pLabel, local); return CheckLateEval(label); } return STATUS_OK; } // Adding a fixed address label StatusCode Asm::AddressLabel(strref label) { StatusCode status = STATUS_OK; Label *pLabel = GetLabel(label); bool constLabel = false; if (!pLabel) { pLabel = AddLabel(label.fnv1a()); } else if (pLabel->constant && pLabel->value!=CurrSection().GetPC()) { return ERROR_MODIFYING_CONST_LABEL; } else { constLabel = pLabel->constant; } pLabel->label_name = label; pLabel->pool_name.clear(); pLabel->section = CurrSection().IsRelativeSection() ? SectionId() : -1; // address labels are based on section pLabel->value = CurrSection().GetPC(); pLabel->evaluated = true; pLabel->pc_relative = true; pLabel->external = MatchXDEF(label); pLabel->reference = false; pLabel->constant = constLabel; last_label = label; bool local = label[0]=='.' || label[0]=='@' || label[0]=='!' || label[0]==':' || label.get_last()=='$'; LabelAdded(pLabel, local); if (local) { MarkLabelLocal(label); } status = CheckLateEval(label); if (!local && label[0]!=']') { // MERLIN: Variable label does not invalidate local labels StatusCode this_status = FlushLocalLabels(); if (status=FIRST_ERROR) { status = this_status; } } return status; } // include symbols listed from a .sym file or all if no listing StatusCode Asm::IncludeSymbols(strref line) { strref symlist = line.before('"').get_trimmed_ws(); line = line.between('"', '"'); size_t size; if (char *buffer = LoadText(line, size)) { strref symfile(buffer, strl_t(size)); while (symfile) { symfile.skip_whitespace(); strref symstart = symfile; if (strref symline = symfile.line()) { int scope_start = symline.find('{'); if (scope_start != 0) { strref symdef = symline.get_substr(0, scope_start); symdef.clip_trailing_whitespace(); strref symtype = symdef.split_token(' '); strref label = symdef.split_token_trim('='); bool constant = symtype.same_str(".const"); // first word is either .label or .const if (symlist) { strref symchk = symlist; while (strref symwant = symchk.split_token_trim(',')) { if (symwant.same_str_case(label)) { AssignLabel(label, symdef, constant); break; } } } else AssignLabel(label, symdef, constant); } if (scope_start >= 0) { symfile = symstart + scope_start; symfile.scoped_block_skip(); } } } loadedData.push_back(buffer); } else return ERROR_COULD_NOT_INCLUDE_FILE; return STATUS_OK; } // Get a string record if it exists StringSymbol *Asm::GetString(strref string_name) { uint32_t string_hash = string_name.fnv1a(); uint32_t index = FindLabelIndex(string_hash, strings.getKeys(), strings.count()); while (index < strings.count() && string_hash == strings.getKey(index)) { if (string_name.same_str(strings.getValue(index).string_name)) return strings.getValues() + index; index++; } return nullptr; } // Add or modify a string record StringSymbol *Asm::AddString(strref string_name, strref string_value) { StringSymbol *pStr = GetString(string_name); if (pStr==nullptr) { uint32_t string_hash = string_name.fnv1a(); uint32_t index = FindLabelIndex(string_hash, strings.getKeys(), strings.count()); strings.insert(index, string_hash); pStr = strings.getValues() + index; pStr->string_name = string_name; pStr->string_value.invalidate(); pStr->string_value.clear(); } if (pStr->string_value.cap()) { free(pStr->string_value.charstr()); pStr->string_value.invalidate(); pStr->string_value.clear(); } pStr->string_const = string_value; return pStr; } // append a string to another string StatusCode StringSymbol::Append(strref append) { if (!append) return STATUS_OK; strl_t add_len = append.get_len(); if (!string_value.cap()) { strl_t new_len = (add_len + 0xff)&(~(strl_t)0xff); char *buf = (char*)malloc(new_len); if (!buf) return ERROR_OUT_OF_MEMORY; string_value.set_overlay(buf, new_len); string_value.copy(string_const); } else if (string_value.cap() < (string_value.get_len() + add_len)) { strl_t new_len = (string_value.get_len() + add_len + 0xff)&(~(strl_t)0xff); char *buf = (char*)malloc(new_len); if (!buf) return ERROR_OUT_OF_MEMORY; strovl ovl(buf, new_len); ovl.copy(string_value.get_strref()); free(string_value.charstr()); string_value.set_overlay(buf, new_len); } string_const.clear(); string_value.append(append); return STATUS_OK; } StatusCode Asm::ParseStringOp(StringSymbol *pStr, strref line) { line.skip_whitespace(); if (line[0] == '+') ++line; for (;;) { line.skip_whitespace(); if (line[0] == '"') { strref substr = line.between('"', '"'); line += substr.get_len() + 2; pStr->Append(substr); } else { strref label = line.split_range(Merlin() ? label_end_char_range_merlin : label_end_char_range); if (StringSymbol *pStr2 = GetString(label)) pStr->Append(pStr2->get()); else if (Label *pLabel = GetLabel(label)) { if (!pLabel->evaluated) return ERROR_TARGET_ADDRESS_MUST_EVALUATE_IMMEDIATELY; strown<32> lblstr; lblstr.sprintf("$%x", pLabel->value); pStr->Append(lblstr.get_strref()); } else break; } line.skip_whitespace(); if (!line || line[0] != '+') break; ++line; line.skip_whitespace(); } return STATUS_OK; } StatusCode Asm::StringAction(StringSymbol *pStr, strref line) { line.skip_whitespace(); if (line[0] == '+' && line[1] == '=') { // append strings line += 2; line.skip_whitespace(); return ParseStringOp(pStr, line); } else if (line[0] == '=') { ++line; line.skip_whitespace(); pStr->clear(); return ParseStringOp(pStr, line); } strref str = pStr->string_value.valid() ? pStr->string_value.get_strref() : pStr->string_const; if (!str) { return STATUS_OK; } char *macro = (char*)malloc(str.get_len()); strovl mac(macro, str.get_len()); mac.copy(str); mac.replace("\\n", "\n"); loadedData.push_back(macro); PushContext(contextStack.curr().source_name, mac.get_strref(), mac.get_strref()); return STATUS_OK; } // // // CONDITIONAL ASSEMBLY // // // Encountered #if or #ifdef, return true if assembly is enabled bool Asm::NewConditional() { if (conditional_nesting[conditional_depth]) { conditional_nesting[conditional_depth]++; return false; } return true; } // Encountered #endif, close out the current conditional void Asm::CloseConditional() { if (conditional_depth>contextStack.curr().conditional_ctx) conditional_depth--; else conditional_consumed[conditional_depth] = false; } // Check if this conditional will nest the assembly (a conditional is already consumed) void Asm::CheckConditionalDepth() { if (conditional_consumed[conditional_depth]) { conditional_depth++; conditional_source[conditional_depth] = contextStack.curr().read_source.get_line(); conditional_consumed[conditional_depth] = false; conditional_nesting[conditional_depth] = 0; } } // This conditional block is going to be assembled, mark it as consumed void Asm::ConsumeConditional() { conditional_source[conditional_depth] = contextStack.curr().read_source.get_line(); conditional_consumed[conditional_depth] = true; } // This conditional block is not going to be assembled so mark that it is nesting void Asm::SetConditional() { conditional_source[conditional_depth] = contextStack.curr().read_source.get_line(); conditional_nesting[conditional_depth] = 1; } // Returns true if assembly is currently enabled bool Asm::ConditionalAsm() { return conditional_nesting[conditional_depth]==0; } // Returns true if this conditional has a block that has already been assembled bool Asm::ConditionalConsumed() { return conditional_consumed[conditional_depth]; } // Returns true if this conditional can be consumed bool Asm::ConditionalAvail() { return conditional_nesting[conditional_depth]==1 && !conditional_consumed[conditional_depth]; } // This conditional block is enabled and the prior wasn't void Asm::EnableConditional(bool enable) { if (enable) { conditional_nesting[conditional_depth] = 0; conditional_consumed[conditional_depth] = true; } } // Conditional else that does not enable block void Asm::ConditionalElse() { if (conditional_consumed[conditional_depth]) conditional_nesting[conditional_depth]++; } // Conditional statement evaluation (true/false) StatusCode Asm::EvalStatement(strref line, bool &result) { struct EvalContext etx; SetEvalCtxDefaults(etx); bool invert = line.get_first()=='!'; if (invert) ++line; int value; if (STATUS_OK != EvalExpression(line, etx, value)) return ERROR_CONDITION_COULD_NOT_BE_RESOLVED; result = (value!=0 && !invert) || (value==0 && invert); return STATUS_OK; } // Add a folder for including files void Asm::AddIncludeFolder(strref path) { if (!path) return; for (std::vector::const_iterator i = includePaths.begin(); i!=includePaths.end(); ++i) { if (path.same_str(*i)) return; } if (includePaths.size()==includePaths.capacity()) includePaths.reserve(includePaths.size() + 16); includePaths.push_back(path); } // unique key binary search int LookupOpCodeIndex(uint32_t hash, OPLookup *lookup, int count) { int first = 0; while (count!=first) { int index = (first+count)/2; uint32_t read = lookup[index].op_hash; if (hash==read) { return index; } else if (hash>read) first = index+1; else count = index; } return -1; // index not found } // Encountered a REPT or LUP StatusCode Asm::Directive_Rept(strref line) { SourceContext &ctx = contextStack.curr(); strref read_source = ctx.read_source; if (read_source.is_substr(line.get())) { read_source.skip(strl_t(line.get() - read_source.get())); strref expression; if (Merlin() || end_macro_directive) { expression = line; // Merlin repeat body begins next line read_source.line(); } else { int block = read_source.find('{'); if (block<0) return ERROR_REPT_MISSING_SCOPE; expression = read_source.get_substr(0, block); read_source += block; read_source.skip_whitespace(); } expression.trim_whitespace(); int count; struct EvalContext etx; SetEvalCtxDefaults(etx); if (STATUS_OK != EvalExpression(expression, etx, count)) return ERROR_REPT_COUNT_EXPRESSION; strref recur; if (Merlin() || end_macro_directive) { recur = read_source; // Merlin repeat body ends at "--^" while (strref next_line = read_source.line()) { next_line = next_line.before_or_full(';'); next_line = next_line.before_or_full(c_comment); int term = next_line.find(end_macro_directive ? "endr" : "--^"); if (term >= 0) { recur = recur.get_substr(0, strl_t(next_line.get() + term - recur.get())); break; } } } else recur = read_source.scoped_block_skip(); ctx.next_source = read_source; PushContext(ctx.source_name, ctx.source_file, recur, count); } return STATUS_OK; } // macro: create an assembler macro StatusCode Asm::Directive_Macro(strref line) { strref read_source = contextStack.curr().read_source.get_skip_ws(); if (!Merlin() && read_source.is_substr(line.get())) read_source.skip(strl_t(line.get()-read_source.get())); if (read_source) { StatusCode error = AddMacro(read_source, contextStack.curr().source_name, contextStack.curr().source_file, read_source); contextStack.curr().next_source = read_source; return error; } return STATUS_OK; } // string: create a symbolic string StatusCode Asm::Directive_String(strref line) { line.skip_whitespace(); strref string_name = line.split_range_trim(word_char_range, line[0]=='.' ? 1 : 0); if (line[0]=='=' || keyword_equ.is_prefix_word(line)) { line.next_word_ws(); strref substr = line; if (line[0] == '"') { substr = line.between('"', '"'); line += substr.get_len() + 2; StringSymbol *pStr = AddString(string_name, substr); if (pStr == nullptr) return ERROR_OUT_OF_MEMORY; line.skip_whitespace(); if (line[0] == '+') return ParseStringOp(pStr, line); } else { StringSymbol *pStr = AddString(string_name, strref()); return ParseStringOp(pStr, line); } } else { if (!AddString(string_name, strref())) return ERROR_OUT_OF_MEMORY; } return STATUS_OK; } StatusCode Asm::Directive_Undef(strref line) { strref name = line.split_range_trim(Merlin() ? label_end_char_range_merlin : label_end_char_range); uint32_t name_hash = name.fnv1a(); uint32_t index = FindLabelIndex(name_hash, labels.getKeys(), labels.count()); while (index < labels.count() && name_hash == labels.getKey(index)) { if (name.same_str(labels.getValue(index).label_name)) { labels.remove(index); return STATUS_OK; } index++; } index = FindLabelIndex(name_hash, strings.getKeys(), strings.count()); while (index < strings.count() && name_hash == strings.getKey(index)) { if (name.same_str(strings.getValue(index).string_name)) { StringSymbol str = strings.getValue(index); if (str.string_value.cap()) { free(str.string_value.charstr()); str.string_value.invalidate(); } strings.remove(index); return STATUS_OK; } index++; } return STATUS_OK; } // include: read in a source file and assemble at this point StatusCode Asm::Directive_Include(strref line) { strref file = line.between('"', '"'); if (!file) // MERLIN: No quotes around PUT filenames file = line.split_range(filename_end_char_range); size_t size = 0; char *buffer = LoadText(file, size); if (buffer) { loadedData.push_back(buffer); strref src(buffer, strl_t(size)); PushContext(file, src, src); } else if (Merlin()) { // MERLIN include file name rules if (file[0] >= '!' && file[0] <= '&') buffer = LoadText(file + 1, size); if (buffer) { loadedData.push_back(buffer); // MERLIN: prepend with !-& to not auto-prepend with T. strref src(buffer, strl_t(size)); PushContext(file+1, src, src); } else { strown<512> fileadd(file[0]>='!' && file[0]<='&' ? (file+1) : file); fileadd.append(".s"); buffer = LoadText(fileadd.get_strref(), size); if (buffer) { loadedData.push_back(buffer); // MERLIN: !+filename appends .S to filenames strref src(buffer, strl_t(size)); PushContext(file, src, src); } else { fileadd.copy("T."); // MERLIN: just filename prepends T. to filenames fileadd.append(file[0]>='!' && file[0]<='&' ? (file+1) : file); buffer = LoadText(fileadd.get_strref(), size); if (buffer) { loadedData.push_back(buffer); strref src(buffer, strl_t(size)); PushContext(file, src, src); } } } } if (!size) return ERROR_COULD_NOT_INCLUDE_FILE; return STATUS_OK; } // incbin: import binary data in place StatusCode Asm::Directive_Incbin(strref line, int skip, int len) { line = line.between('"', '"'); strown<512> filename(line); size_t size = 0; if (char *buffer = LoadBinary(line, size)) { int bin_size = (int)size - skip; if (len && bin_size>len) bin_size = len; if (bin_size>0) AddBin((const uint8_t*)buffer+skip, bin_size); free(buffer); return STATUS_OK; } return ERROR_COULD_NOT_INCLUDE_FILE; } // import is a catch-all file reference StatusCode Asm::Directive_Import(strref line) { line.skip_whitespace(); int skip = 0; // binary import skip this amount int len = 0; // binary import load up to this amount strref param; // read out skip & max len parameters int q = line.find('"'); if (q>=0) { param = line + q; param.scoped_block_skip(); param.trim_whitespace(); if (param[0]==',') { ++param; param.skip_whitespace(); if (param) { struct EvalContext etx; SetEvalCtxDefaults(etx); EvalExpression(param.split_token_trim(','), etx, skip); if (param) { EvalExpression(param, etx, len); } } } } if (line[0]=='"') return Directive_Incbin(line); else if (import_source.is_prefix_word(line)) { line += import_source.get_len(); line.skip_whitespace(); return Directive_Include(line); } else if (import_binary.is_prefix_word(line)) { line += import_binary.get_len(); line.skip_whitespace(); return Directive_Incbin(line, skip, len); } else if (import_c64.is_prefix_word(line)) { line += import_c64.get_len(); line.skip_whitespace(); return Directive_Incbin(line, 2+skip, len); // 2 = load address skip size } else if (import_text.is_prefix_word(line)) { line += import_text.get_len(); line.skip_whitespace(); strref text_type = "petscii"; while (line[0]!='"') { strref word = line.get_word_ws(); if (word.same_str("petscii") || word.same_str("petscii_shifted")) { text_type = line.get_word_ws(); line += text_type.get_len(); line.skip_whitespace(); } else if (StringSymbol *pStr = GetString(line.get_word_ws())) { line = pStr->get(); break; } } CurrSection().AddText(line, text_type); return STATUS_OK; } else if (import_object.is_prefix_word(line)) { line += import_object.get_len(); line.trim_whitespace(); return ReadObjectFile(line[0]=='"' ? line.between('"', '"') : line); } else if (import_symbols.is_prefix_word(line)) { line += import_symbols.get_len(); line.skip_whitespace(); return IncludeSymbols(line); } return STATUS_OK; } // org / pc: current address of code StatusCode Asm::Directive_ORG(strref line) { int addr; if (line[0]=='=') ++line; else if (keyword_equ.is_prefix_word(line)) // optional '=' or equ line.next_word_ws(); line.skip_whitespace(); struct EvalContext etx; SetEvalCtxDefaults(etx); StatusCode error = EvalExpression(line, etx, addr); if (error != STATUS_OK) return (error == STATUS_NOT_READY || error == STATUS_XREF_DEPENDENT) ? ERROR_TARGET_ADDRESS_MUST_EVALUATE_IMMEDIATELY : error; // Section immediately followed by ORG reassigns that section to be fixed Section &currSection = CurrSection(); if (currSection.size()==0 && !currSection.IsDummySection() && !currSection.address_assigned) { if (currSection.type == ST_ZEROPAGE && addr >= 0x100) return ERROR_ZEROPAGE_SECTION_OUT_OF_RANGE; AssignAddressToSection(SectionId(), addr); } else SetSection(strref(), addr); return STATUS_OK; } // load: address for target to load code at StatusCode Asm::Directive_LOAD(strref line) { int addr; if (line[0]=='=' || keyword_equ.is_prefix_word(line)) line.next_word_ws(); struct EvalContext etx; SetEvalCtxDefaults(etx); StatusCode error = EvalExpression(line, etx, addr); if (error != STATUS_OK) return (error == STATUS_NOT_READY || error == STATUS_XREF_DEPENDENT) ? ERROR_TARGET_ADDRESS_MUST_EVALUATE_IMMEDIATELY : error; CurrSection().SetLoadAddress(addr); return STATUS_OK; } StatusCode Asm::Directive_MERGE(strref line) { int first_section = -1; strref section_name = line.split_label(); // get the first section that matches the first name and has an assigned address for (size_t section_id = 0; section_id!=allSections.size(); ++section_id) { const Section §ion = allSections[section_id]; if (!section.IsMergedSection()&§ion.name.same_str(section_name)) { if (first_section<0||!allSections[first_section].IsRelativeSection()) { first_section = (int)section_id; } } } if (first_section<0) { return ERROR_NOT_A_SECTION; } // merge all sections as defined by the line while (section_name) { for (size_t section_id = 0; section_id!=allSections.size(); ++section_id) { const Section §ion = allSections[section_id]; if (section_id!=first_section&&!section.IsMergedSection()&§ion.IsRelativeSection()) { if (section.name.same_str(section_name)) { StatusCode result = MergeSections(first_section, (int)section_id); if (result!=STATUS_OK) { return result; } } } } if (line[0]==',') { ++line; } section_name = line.split_label(); } return STATUS_OK; } // MERLIN version of AD_LINK, which is more like AD_INCOBJ + link to current section StatusCode Asm::Directive_LNK(strref line) { strref file = line.between('"', '"'); if (!file) // MERLIN: No quotes around include filenames file = line.split_range(filename_end_char_range); int section_id = SectionId(); StatusCode error = ReadObjectFile(file, SectionId()); // restore current section current_section = &allSections[section_id]; return error; } // this stores a string that when matched with a label will make that label external StatusCode Asm::Directive_XDEF(strref line) { line.trim_whitespace(); if (strref xdef = line.split_range(Merlin() ? label_end_char_range_merlin : label_end_char_range)) { char f = xdef.get_first(); char e = xdef.get_last(); if (f != '.' && f != '!' && f != '@' && e != '$') { uint32_t hash = xdef.fnv1a(); uint32_t pos = FindLabelIndex(hash, xdefs.getKeys(), xdefs.count()); while (pos < xdefs.count() && xdefs.getKey(pos) == hash) { if (xdefs.getValue(pos).same_str_case(xdef)) return STATUS_OK; ++pos; } xdefs.insert(pos, hash); xdefs.getValues()[pos] = xdef; } } return STATUS_OK; } StatusCode Asm::Directive_XREF(strref label) { // XREF already defined label => no action if (!GetLabel(label)) { Label *pLabelXREF = AddLabel(label.fnv1a()); pLabelXREF->label_name = label; pLabelXREF->pool_name.clear(); pLabelXREF->section = -1; // address labels are based on section pLabelXREF->value = 0; pLabelXREF->evaluated = true; pLabelXREF->pc_relative = true; pLabelXREF->external = false; pLabelXREF->constant = false; pLabelXREF->reference = true; } return STATUS_OK; } // dc.b, dc.w, dc.t, dc.l, ADR, ADRL, bytes, words, long StatusCode Asm::Directive_DC(strref line, int width, strref source_file) { struct EvalContext etx; SetEvalCtxDefaults(etx); line.trim_whitespace(); while (strref exp_dc = line.split_token_trim(',')) { int value = 0; if (!CurrSection().IsDummySection()) { if (Merlin() && exp_dc.get_first() == '#') // MERLIN allows for an immediate declaration on data ++exp_dc; StatusCode error = EvalExpression(exp_dc, etx, value); if (error > STATUS_XREF_DEPENDENT) break; else if (error == STATUS_NOT_READY || error == STATUS_XREF_DEPENDENT) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], exp_dc, source_file, width == 1 ? LateEval::LET_BYTE : (width == 2 ? LateEval::LET_ABS_REF : (width == 3 ? LateEval::LET_ABS_L_REF : LateEval::LET_ABS_4_REF))); else if (error == STATUS_RELATIVE_SECTION) { value = 0; CurrSection().AddReloc(lastEvalValue, CurrSection().DataOffset(), lastEvalSection, (int8_t)width, (int8_t)lastEvalShift); } } uint8_t bytes[4] = { (uint8_t)value, (uint8_t)(value >> 8), (uint8_t)(value >> 16), (uint8_t)(value >> 24) }; AddBin(bytes, width); } return STATUS_OK; } // ds/ds.b/ds.w/ds.t/ds.l StatusCode Asm::Directive_DS(strref line) { int width = 1; int value; if (line.get_first() == '.' && strref::is_alphabetic(line[1])) { switch (strref::tolower(line[1])) { case 'b': break; case 'w': width = 2; break; case 't': width = 3; break; case 'l': width = 4; break; } line += 2; line.skip_whitespace(); } struct EvalContext etx; SetEvalCtxDefaults(etx); strref size = line.split_token_trim(','); if (STATUS_OK != EvalExpression(size, etx, value)) return ERROR_DS_MUST_EVALUATE_IMMEDIATELY; int fill = 0; if (line && STATUS_OK != EvalExpression(line, etx, fill)) return ERROR_DS_MUST_EVALUATE_IMMEDIATELY; value *= width; if (value > 0) { for (int n = 0; n < value; n++) AddByte(fill); } else if (value) { CurrSection().AddAddress(value); if (CurrSection().type == ST_ZEROPAGE && CurrSection().address > 0x100) return ERROR_ZEROPAGE_SECTION_OUT_OF_RANGE; } return STATUS_OK; } StatusCode Asm::Directive_ALIGN(strref line) { if (line) { if (line[0] == '=' || keyword_equ.is_prefix_word(line)) line.next_word_ws(); struct EvalContext etx; SetEvalCtxDefaults(etx); int value; int status = EvalExpression(line, etx, value); if (status == STATUS_NOT_READY || status == STATUS_XREF_DEPENDENT) return ERROR_ALIGN_MUST_EVALUATE_IMMEDIATELY; if (status == STATUS_OK && value>0) { if (CurrSection().address_assigned) { int add = (CurrSection().GetPC() + value - 1) % value; for (int a = 0; a < add; a++) AddByte(0); } else CurrSection().align_address = value; } } return STATUS_OK; } StatusCode Asm::Directive_EVAL(strref line) { int value = 0; strref description = line.find(':') >= 0 ? line.split_token_trim(':') : strref(); line.trim_whitespace(); struct EvalContext etx; SetEvalCtxDefaults(etx); strref lab1 = line; lab1 = lab1.split_token_any_trim(Merlin() ? label_end_char_range_merlin : label_end_char_range); StringSymbol *pStr = line.same_str_case(lab1) ? GetString(lab1) : nullptr; if (line && EvalExpression(line, etx, value) == STATUS_OK) { if (description) { if (pStr != nullptr) { printf("EVAL(%d): " STRREF_FMT ": \"" STRREF_FMT "\" = \"" STRREF_FMT "\" = $%x\n", contextStack.curr().source_file.count_lines(description) + 1, STRREF_ARG(description), STRREF_ARG(line), STRREF_ARG(pStr->get()), value); } else { printf("EVAL(%d): " STRREF_FMT ": \"" STRREF_FMT "\" = $%x\n", contextStack.curr().source_file.count_lines(description) + 1, STRREF_ARG(description), STRREF_ARG(line), value); } } else { if (pStr != nullptr) { printf("EVAL(%d): \"" STRREF_FMT "\" = \"" STRREF_FMT "\" = $%x\n", contextStack.curr().source_file.count_lines(line) + 1, STRREF_ARG(line), STRREF_ARG(pStr->get()), value); } else { printf("EVAL(%d): \"" STRREF_FMT "\" = $%x\n", contextStack.curr().source_file.count_lines(line) + 1, STRREF_ARG(line), value); } } } else if (description) { if (pStr != nullptr) { printf("EVAL(%d): " STRREF_FMT ": \"" STRREF_FMT "\" = \"" STRREF_FMT "\"\n", contextStack.curr().source_file.count_lines(description) + 1, STRREF_ARG(description), STRREF_ARG(line), STRREF_ARG(pStr->get())); } else { printf("EVAL(%d): \"" STRREF_FMT ": " STRREF_FMT"\"\n", contextStack.curr().source_file.count_lines(description) + 1, STRREF_ARG(description), STRREF_ARG(line)); } } else { if (pStr != nullptr) { printf("EVAL(%d): \"" STRREF_FMT "\" = \"" STRREF_FMT "\"\n", contextStack.curr().source_file.count_lines(line) + 1, STRREF_ARG(line), STRREF_ARG(pStr->get())); } else { printf("EVAL(%d): \"" STRREF_FMT "\"\n", contextStack.curr().source_file.count_lines(line) + 1, STRREF_ARG(line)); } } return STATUS_OK; } StatusCode Asm::Directive_HEX(strref line) { uint8_t b = 0, v = 0; while (line) { // indeterminable length, can't read hex to int char c = *line.get(); ++line; if (c == ',') { if (b) // probably an error but seems safe AddByte(v); b = 0; line.skip_whitespace(); } else { if (c >= '0' && c <= '9') v = (v << 4) + (c - '0'); else if (c >= 'A' && c <= 'Z') v = (v << 4) + (c - 'A' + 10); else if (c >= 'a' && c <= 'z') v = (v << 4) + (c - 'a' + 10); else break; b ^= 1; if (!b) AddByte(v); } } if (b) return ERROR_HEX_WITH_ODD_NIBBLE_COUNT; return STATUS_OK; } StatusCode Asm::Directive_ENUM_STRUCT(strref line, AssemblerDirective dir) { strref read_source = contextStack.curr().read_source; if (read_source.is_substr(line.get())) { strref struct_name = line.get_word(); line.skip(struct_name.get_len()); line.skip_whitespace(); read_source.skip(strl_t(line.get() - read_source.get())); if (read_source[0] == '{') { if (dir == AD_STRUCT) BuildStruct(struct_name, read_source.scoped_block_skip()); else BuildEnum(struct_name, read_source.scoped_block_skip()); } else return dir == AD_STRUCT ? ERROR_STRUCT_CANT_BE_ASSEMBLED : ERROR_ENUM_CANT_BE_ASSEMBLED; contextStack.curr().next_source = read_source; } else return ERROR_STRUCT_CANT_BE_ASSEMBLED; return STATUS_OK; } // Action based on assembler directive StatusCode Asm::ApplyDirective(AssemblerDirective dir, strref line, strref source_file) { StatusCode error = STATUS_OK; if (!ConditionalAsm()) { // If conditionally blocked from assembling only check conditional directives if (dir!=AD_IF && dir!=AD_IFDEF && dir!=AD_ELSE && dir!=AD_ELIF && dir!=AD_ELSE && dir!=AD_ENDIF) return STATUS_OK; } struct EvalContext etx; SetEvalCtxDefaults(etx); switch (dir) { case AD_CPU: for (int c = 0; c < nCPUs; c++) { if (line.same_str(aCPUs[c].name)) { if (c != cpu) SetCPU((CPUIndex)c); return STATUS_OK; } } return ERROR_CPU_NOT_SUPPORTED; case AD_EXPORT: line.trim_whitespace(); CurrSection().export_append = line.split_label(); break; case AD_ORG: return Directive_ORG(line); case AD_LOAD: return Directive_LOAD(line); case AD_SECTION: SetSection(line); break; case AD_MERGE: return Directive_MERGE(line); case AD_LINK: return LinkSections(line.get_trimmed_ws()); case AD_LNK: return Directive_LNK(line); case AD_INCOBJ: { strref file = line.between('"', '"'); if (!file) // MERLIN: No quotes around include filenames file = line.split_range(filename_end_char_range); error = ReadObjectFile(file); break; } case AD_XDEF: return Directive_XDEF(line.get_trimmed_ws()); case AD_XREF: Directive_XREF(line.split_range_trim( Merlin() ? label_end_char_range_merlin : label_end_char_range)); break; case AD_ENT: // MERLIN version of xdef, makes most recently defined label external if (Label *pLastLabel = GetLabel(last_label)) pLastLabel->external = true; break; case AD_EXT: Directive_XREF(last_label); break; case AD_ALIGN: // align: align address to multiple of value, fill space with 0 return Directive_ALIGN(line); case AD_EVAL: // eval: display the result of an expression in stdout return Directive_EVAL(line); case AD_BYTES: // bytes: add bytes by comma separated values/expressions return Directive_DC(line, 1, source_file); case AD_WORDS: // words: add words (16 bit values) by comma separated values return Directive_DC(line, 2, source_file); case AD_ADR: // ADR: MERLIN store 3 byte word return Directive_DC(line, 3, source_file); case AD_ADRL: // ADRL: MERLIN store 4 byte word return Directive_DC(line, 4, source_file); case AD_DC: { int width = 1; if (line[0]=='.') { ++line; switch (strref::tolower(line.get_first())) { case 'b': width = 1; break; case 'w': width = 2; break; case 't': width = 3; break; case 'l': width = 4; break; default: return ERROR_BAD_TYPE_FOR_DECLARE_CONSTANT; } ++line; } return Directive_DC(line, width, source_file); } case AD_HEX: return Directive_HEX(line); case AD_EJECT: line.clear(); break; case AD_USR: line.clear(); break; case AD_CYC: list_flags |= cycle_counter_level ? ListLine::CYCLES_STOP : ListLine::CYCLES_START; cycle_counter_level = !!cycle_counter_level; break; case AD_SAV: line.trim_whitespace(); if (line.has_prefix(export_base_name)) line.skip(export_base_name.get_len()); if (line) CurrSection().export_append = line.split_label(); AssignAddressToGroup(); break; case AD_XC: // XC: MERLIN version of setting CPU if (strref("off").is_prefix_word(line)) SetCPU(CPU_6502); else if (strref("xc").is_prefix_word(line)) SetCPU(CPU_65816); else if (cpu==CPU_65C02) SetCPU(CPU_65816); else SetCPU(CPU_65C02); break; case AD_TEXT: { // text: add text within quotes strref text_prefix; if (line[0]=='[') { strref str = line.scoped_block_skip().get_trimmed_ws(); if (StringSymbol *StringSym = GetString(str)) { line.skip_whitespace(); if (line[0] == '"') line = line.between('"', '"'); CurrSection().AddIndexText(StringSym, line); break; } } while (line[0] != '"') { strref word = line.get_word_ws(); if (word.same_str("petscii") || word.same_str("petscii_shifted")) { text_prefix = line.get_word_ws(); line += text_prefix.get_len(); line.skip_whitespace(); } else if (StringSymbol *pStr = GetString(line.get_word_ws())) { line = pStr->get(); break; } } if (line[0] == '"') line = line.between('"', '"'); CurrSection().AddText(line, text_prefix); break; } case AD_MACRO: error = Directive_Macro(line); break; case AD_INCLUDE: // assemble another file in place return Directive_Include(line); case AD_INCBIN: return Directive_Incbin(line); case AD_IMPORT: return Directive_Import(line); case AD_LABEL: case AD_CONST: { line.trim_whitespace(); strref label = line.split_range_trim(word_char_range, line[0]=='.' ? 1 : 0); if (line[0]=='=' || keyword_equ.is_prefix_word(line)) { line.next_word_ws(); AssignLabel(label, line, dir==AD_CONST); } else error = ERROR_UNEXPECTED_LABEL_ASSIGMENT_FORMAT; break; } case AD_STRING: return Directive_String(line); case AD_UNDEF: return Directive_Undef(line); case AD_INCSYM: return IncludeSymbols(line); case AD_LABPOOL: { strref name = line.split_range_trim(word_char_range, line[0]=='.' ? 1 : 0); AddLabelPool(name, line); break; } case AD_IF: if (NewConditional()) { // Start new conditional block CheckConditionalDepth(); // Check if nesting bool conditional_result; error = EvalStatement(line, conditional_result); if (conditional_result) ConsumeConditional(); else SetConditional(); } break; case AD_IFDEF: if (NewConditional()) { // Start new conditional block CheckConditionalDepth(); // Check if nesting bool conditional_result; error = EvalStatement(line, conditional_result); strref name = line.get_trimmed_ws(); if (GetLabel(name) != nullptr || GetString(name) != nullptr) ConsumeConditional(); else SetConditional(); } break; case AD_ELSE: if (ConditionalAsm()) { if (ConditionalConsumed()) ConditionalElse(); else error = ERROR_ELSE_WITHOUT_IF; } else if (ConditionalAvail()) EnableConditional(true); break; case AD_ELIF: if (ConditionalAsm()) { if (ConditionalConsumed()) ConditionalElse(); else error = ERROR_ELSE_WITHOUT_IF; } else if (ConditionalAvail()) { bool conditional_result; error = EvalStatement(line, conditional_result); EnableConditional(conditional_result); } break; case AD_ENDIF: if (ConditionalAsm()) { if (ConditionalConsumed()) CloseConditional(); else error = ERROR_ENDIF_WITHOUT_CONDITION; } else { conditional_nesting[conditional_depth]--; if (ConditionalAsm()) CloseConditional(); } break; case AD_ENUM: case AD_STRUCT: return Directive_ENUM_STRUCT(line, dir); case AD_REPT: return Directive_Rept(line); case AD_INCDIR: AddIncludeFolder(line.between('"', '"')); break; case AD_A16: // A16: Set 16 bit accumulator mode accumulator_16bit = true; break; case AD_A8: // A8: Set 8 bit accumulator mode accumulator_16bit = false; break; case AD_XY16: // A16: Set 16 bit accumulator mode index_reg_16bit = true; break; case AD_XY8: // A8: Set 8 bit accumulator mode index_reg_16bit = false; break; case AD_MX: if (line) { line.trim_whitespace(); int value = 0; error = EvalExpression(line, etx, value); index_reg_16bit = !(value&1); accumulator_16bit = !(value&2); } break; case AD_ABORT: line.trim_whitespace(); if (line) printf("Assembler aborted: " STRREF_FMT "\n", STRREF_ARG(line)); return ERROR_ABORTED; case AD_LST: line.clear(); break; case AD_DUMMY: line.trim_whitespace(); if (line) { int reorg; if (STATUS_OK == EvalExpression(line, etx, reorg)) { DummySection(reorg); break; } } DummySection(); break; case AD_DUMMY_END: while (CurrSection().IsDummySection()) { EndSection(); if (SectionId()==0) break; } break; case AD_DS: return Directive_DS(line); } return error; } // Make an educated guess at the intended address mode from an opcode argument StatusCode Asm::GetAddressMode(strref line, bool flipXY, uint32_t validModes, AddrMode &addrMode, int &len, strref &expression) { bool force_zp = false; bool force_24 = false; bool force_abs = false; bool need_more = true; strref arg, deco; len = 0; while (need_more) { need_more = false; uint8_t c = line.get_first(); if (!c) addrMode = AMB_NON; else if (!force_abs && (c == '[' || (c == '(' && (validModes&(AMM_REL | AMM_REL_X | AMM_ZP_REL | AMM_ZP_REL_X | AMM_ZP_Y_REL))))) { deco = line.scoped_block_skip(); line.skip_whitespace(); expression = deco.split_token_trim(','); addrMode = c == '[' ? (force_zp ? AMB_ZP_REL_L : AMB_REL_L) : (force_zp ? AMB_ZP_REL : AMB_REL); if (strref::tolower(deco[0]) == 'x') addrMode = c == '[' ? AMB_ILL : AMB_ZP_REL_X; else if (line[0] == ',') { ++line; line.skip_whitespace(); if (strref::tolower(line[0]) == 'y') { if (strref::tolower(deco[0]) == 's') addrMode = AMB_STK_REL_Y; else addrMode = c == '[' ? AMB_ZP_REL_Y_L : AMB_ZP_Y_REL; ++line; } } } else if (c == '#') { ++line; addrMode = AMB_IMM; expression = line; } else if (line) { if (line[0]=='.' && strref::is_ws(line[2])) { switch (strref::tolower(line[1])) { case 'z': force_zp = true; line += 3; need_more = true; len = 1; break; case 'b': line += 3; need_more = true; len = 1; break; case 'w': line += 3; need_more = true; len = 2; break; case 'l': force_24 = true; line += 3; need_more = true; len = 3; break; case 'a': force_abs = true; line += 3; need_more = true; break; } } if (!need_more) { if (strref("A").is_prefix_word(line)) { addrMode = AMB_ACC; } else { // absolute (zp, offs x, offs y) addrMode = force_24 ? AMB_ABS_L : (force_zp ? AMB_ZP : AMB_ABS); expression = line.split_token_trim(','); if (line && (line[0]=='s' || line[0]=='S')) addrMode = AMB_STK; else { bool relX = line && (line[0]=='x' || line[0]=='X'); bool relY = line && (line[0]=='y' || line[0]=='Y'); if ((flipXY && relY) || (!flipXY && relX)) addrMode = force_24 ? AMB_ABS_L_X : (force_zp ? AMB_ZP_X : AMB_ABS_X); else if ((flipXY && relX) || (!flipXY && relY)) { if (force_zp) { return ERROR_INSTRUCTION_NOT_ZP; } addrMode = AMB_ABS_Y; } } } } } } return STATUS_OK; } // Push an opcode to the output buffer in the current section StatusCode Asm::AddOpcode(strref line, int index, strref source_file) { StatusCode error = STATUS_OK; strref expression; // allowed modes uint32_t validModes = opcode_table[index].modes; // instruction parameter length override int op_param = 0; // Get the addressing mode and the expression it refers to AddrMode addrMode; switch (validModes) { case AMC_BBR: addrMode = AMB_ZP_ABS; expression = line.split_token_trim(','); if (!expression || !line) return ERROR_INVALID_ADDRESSING_MODE; break; case AMM_BRA: addrMode = AMB_ABS; expression = line; break; case AMM_ACC: case (AMM_ACC|AMM_NON): case AMM_NON: addrMode = AMB_NON; break; case AMM_BLK_MOV: addrMode = AMB_BLK_MOV; expression = line.before_or_full(','); break; default: error = GetAddressMode(line, !!(validModes & AMM_FLIPXY), validModes, addrMode, op_param, expression); break; } int value = 0; int target_section = -1; int target_section_offs = -1; int8_t target_section_shift = 0; bool evalLater = false; if (expression) { struct EvalContext etx; SetEvalCtxDefaults(etx); if (validModes & (AMM_BRANCH | AMM_BRANCH_L)) etx.relative_section = SectionId(); error = EvalExpression(expression, etx, value); if (error == STATUS_NOT_READY || error == STATUS_XREF_DEPENDENT) { evalLater = true; error = STATUS_OK; } else if (error == STATUS_RELATIVE_SECTION) { target_section = lastEvalSection; target_section_offs = lastEvalValue; target_section_shift = lastEvalShift; } else if (error != STATUS_OK) return error; } // check if address is in zero page range and should use a ZP mode instead of absolute if (!evalLater && value>=0 && value<0x100 && (error != STATUS_RELATIVE_SECTION || (target_section>=0 && allSections[target_section].type==ST_ZEROPAGE))) { switch (addrMode) { case AMB_ABS: if (validModes & AMM_ZP) addrMode = AMB_ZP; else if (validModes & AMM_ABS_L) addrMode = AMB_ABS_L; break; case AMB_ABS_X: if (validModes & AMM_ZP_X) addrMode = AMB_ZP_X; else if (validModes & AMM_ABS_L_X) addrMode = AMB_ABS_L_X; break; default: break; } } // Check if an explicit 24 bit address if (expression[0] == '$' && (expression + 1).len_hex()>4) { if (addrMode==AMB_ABS&&(validModes & AMM_ABS_L)) { addrMode = AMB_ABS_L; } else if (addrMode==AMB_ABS_X&&(validModes & AMM_ABS_L_X)) { addrMode = AMB_ABS_L_X; } } if (!(validModes & (1 << addrMode))) { if (addrMode==AMB_ZP_REL_X&&(validModes & AMM_REL_X)) { addrMode = AMB_REL_X; } else if (addrMode==AMB_REL&&(validModes & AMM_ZP_REL)) { addrMode = AMB_ZP_REL; } else if (addrMode==AMB_ABS&&(validModes & AMM_ABS_L)) { addrMode = AMB_ABS_L; } else if (addrMode==AMB_ABS_X&&(validModes & AMM_ABS_L_X)) { addrMode = AMB_ABS_L_X; } else if (addrMode==AMB_REL_L&&(validModes & AMM_ZP_REL_L)) { addrMode = AMB_ZP_REL_L; } else if (Merlin()&&addrMode==AMB_IMM && validModes==AMM_ABS) { addrMode = AMB_ABS; // Merlin seems to allow this } else if (Merlin()&&addrMode==AMB_ABS && validModes==AMM_ZP_REL) { addrMode = AMB_ZP_REL; // Merlin seems to allow this } else { return ERROR_INVALID_ADDRESSING_MODE; } } // Add the instruction and argument to the code if (error == STATUS_OK || error == STATUS_RELATIVE_SECTION) { uint8_t opcode = opcode_table[index].aCodes[addrMode]; StatusCode cap_status = CheckOutputCapacity(4); if (cap_status != STATUS_OK) return error; AddByte(opcode); CODE_ARG codeArg = CA_NONE; if (validModes & AMM_BRANCH_L) codeArg = CA_BRANCH_16; else if (validModes & AMM_BRANCH) codeArg = CA_BRANCH; else { switch (addrMode) { case AMB_ZP_REL_X: // 0 ($12:x) case AMB_ZP: // 1 $12 case AMB_ZP_Y_REL: // 4 ($12),y case AMB_ZP_X: // 5 $12,x case AMB_ZP_REL: // b ($12) case AMB_ZP_REL_L: // e [$02] case AMB_ZP_REL_Y_L: // f [$00],y case AMB_STK: // 12 $12,s case AMB_STK_REL_Y: // 13 ($12,s),y codeArg = CA_ONE_BYTE; break; case AMB_ABS_Y: // 6 $1234,y case AMB_ABS_X: // 7 $1234,x case AMB_ABS: // 3 $1234 case AMB_REL: // 8 ($1234) case AMB_REL_X: // c ($1234,x) case AMB_REL_L: // 14 [$1234] codeArg = CA_TWO_BYTES; break; case AMB_ABS_L: // 10 $e00001 case AMB_ABS_L_X: // 11 $123456,x codeArg = CA_THREE_BYTES; break; case AMB_ZP_ABS: // d $12, label codeArg = CA_BYTE_BRANCH; break; case AMB_BLK_MOV: // 15 $12,$34 codeArg = CA_TWO_ARG_BYTES; break; case AMB_IMM: // 2 #$12 if (op_param && (validModes&(AMM_IMM_DBL_A | AMM_IMM_DBL_XY))) codeArg = op_param == 2 ? CA_TWO_BYTES : CA_ONE_BYTE; else if ((validModes&(AMM_IMM_DBL_A | AMM_IMM_DBL_XY)) && expression[0]=='$' && (expression+1).len_hex()==4) codeArg = CA_TWO_BYTES; else if (((validModes&AMM_IMM_DBL_A) && accumulator_16bit) || ((validModes&AMM_IMM_DBL_XY) && index_reg_16bit)) codeArg = CA_TWO_BYTES; else codeArg = CA_ONE_BYTE; break; case AMB_ACC: // 9 A case AMB_NON: // a default: break; } } switch (codeArg) { case CA_ONE_BYTE: if (evalLater) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], expression, source_file, LateEval::LET_BYTE); else if (error == STATUS_RELATIVE_SECTION) CurrSection().AddReloc(target_section_offs, CurrSection().DataOffset(), target_section, 1, target_section_shift); AddByte(value); break; case CA_TWO_BYTES: if (evalLater) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], expression, source_file, LateEval::LET_ABS_REF); else if (error == STATUS_RELATIVE_SECTION) { CurrSection().AddReloc(target_section_offs, CurrSection().DataOffset(), target_section, 2, target_section_shift); value = 0; } AddWord(value); break; case CA_THREE_BYTES: if (evalLater) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], expression, source_file, LateEval::LET_ABS_L_REF); else if (error == STATUS_RELATIVE_SECTION) { CurrSection().AddReloc(target_section_offs, CurrSection().DataOffset(), target_section, 3, target_section_shift); value = 0; } AddTriple(value); break; case CA_TWO_ARG_BYTES: { if (evalLater) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], expression, source_file, LateEval::LET_BYTE); else if (error == STATUS_RELATIVE_SECTION) { CurrSection().AddReloc(target_section_offs, CurrSection().DataOffset(), target_section, 1, target_section_shift); } AddByte(value); struct EvalContext etx; SetEvalCtxDefaults(etx); etx.pc = CurrSection().GetPC()-2; line.split_token_trim(','); error = EvalExpression(line, etx, value); if (error==STATUS_NOT_READY || error == STATUS_XREF_DEPENDENT) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], line, source_file, LateEval::LET_BYTE); AddByte(value); break; } case CA_BRANCH: if (evalLater) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], expression, source_file, LateEval::LET_BRANCH); else if (((int)value - (int)CurrSection().GetPC()-1) < -128 || ((int)value - (int)CurrSection().GetPC()-1) > 127) error = ERROR_BRANCH_OUT_OF_RANGE; AddByte(evalLater ? 0 : (uint8_t)((int)value - (int)CurrSection().GetPC()) - 1); break; case CA_BRANCH_16: if (evalLater) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], expression, source_file, LateEval::LET_BRANCH_16); AddWord(evalLater ? 0 : (value-(CurrSection().GetPC()+2))); break; case CA_BYTE_BRANCH: { if (evalLater) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], expression, source_file, LateEval::LET_BYTE); else if (error == STATUS_RELATIVE_SECTION) CurrSection().AddReloc(target_section_offs, CurrSection().DataOffset(), target_section, 1, target_section_shift); AddByte(value); struct EvalContext etx; SetEvalCtxDefaults(etx); etx.pc = CurrSection().GetPC()-2; etx.relative_section = SectionId(); error = EvalExpression(line, etx, value); if (error==STATUS_NOT_READY || error == STATUS_XREF_DEPENDENT) AddLateEval(CurrSection().DataOffset(), CurrSection().GetPC(), scope_address[scope_depth], line, source_file, LateEval::LET_BRANCH); else if (((int)value - (int)CurrSection().GetPC() - 1) < -128 || ((int)value - (int)CurrSection().GetPC() - 1) > 127) error = ERROR_BRANCH_OUT_OF_RANGE; AddByte((error == STATUS_NOT_READY || error == STATUS_XREF_DEPENDENT) ? 0 : (uint8_t)((int)value - (int)CurrSection().GetPC()) - 1); break; } case CA_NONE: break; } } return error; } // Build a line of code void Asm::PrintError(strref line, StatusCode error) { strown<512> errorText; if (contextStack.has_work()) { errorText.sprintf("Error " STRREF_FMT "(%d): ", STRREF_ARG(contextStack.curr().source_name), contextStack.curr().source_file.count_lines(line)+1); } else { errorText.append("Error: "); } errorText.append(aStatusStrings[error]); errorText.append(" \""); errorText.append(line.get_trimmed_ws()); errorText.append("\"\n"); errorText.c_str(); fwrite(errorText.get(), errorText.get_len(), 1, stderr); error_encountered = true; } // Build a line of code StatusCode Asm::BuildLine(strref line) { StatusCode error = STATUS_OK; // MERLIN: First char of line is * means comment if (Merlin()&&line[0]=='*') { return STATUS_OK; } // remember for listing int start_section = SectionId(); int start_address = CurrSection().address; strref code_line = line; list_flags = 0; while (line && error == STATUS_OK) { strref line_start = line; char char0 = line[0]; // first char including white space line.skip_whitespace(); // skip to first character line = line.before_or_full(';'); // clip any line comments line = line.before_or_full(c_comment); line.clip_trailing_whitespace(); if (line[0]==':'&&!Merlin()) { ++line; } // Kick Assembler macro prefix (incompatible with merlin) strref line_nocom = line; strref operation = line.split_range(Merlin() ? label_end_char_range_merlin : label_end_char_range); char char1 = operation[0]; // first char of first word char charE = operation.get_last(); // end char of first word line.trim_whitespace(); bool force_label = charE==':' || charE=='$'; if (!force_label && Merlin()&&(line||operation)) { // MERLIN fixes and PoP does some naughty stuff like 'and = 0' force_label = (!strref::is_ws(char0)&&char0!='{' && char0!='}')||char1==']'||charE=='?'; } else if (!Merlin()&&line[0]==':') { force_label = true; } if (!operation && !force_label) { if (ConditionalAsm()) { // scope open / close switch (line[0]) { case '{': error = EnterScope(); brace_depth++; list_flags |= ListLine::CYCLES_START; if (error == STATUS_OK) { ++line; line.skip_whitespace(); } break; case '}': // check for late eval of anything with an end scope error = ExitScope(); for (LabelPool *pool = labelPools.getValues(), *end = pool+labelPools.count(); pool!=end; pool++) { pool->ExitScope((uint16_t)brace_depth); } brace_depth--; list_flags |= ListLine::CYCLES_STOP; if (error == STATUS_OK) { ++line; line.skip_whitespace(); } break; case '*': // if first char is '*' this seems like a line comment on some assemblers line.clear(); break; case 127: ++line; // bad character? break; } } else { line.clear(); } } else { // ignore leading period for instructions and directives - not for labels strref label = operation; if ((!Merlin()&&operation[0]==':')||operation[0]=='.') { ++operation; } operation = operation.before_or_full('.'); int op_idx = LookupOpCodeIndex(operation.fnv1a_lower(), aInstructions, num_instructions); if (op_idx >= 0 && !force_label && (aInstructions[op_idx].type==OT_DIRECTIVE || line[0]!='=')) { if (line_nocom.is_substr(operation.get())) { line = line_nocom + strl_t(operation.get()+operation.get_len()-line_nocom.get()); line.skip_whitespace(); } if (aInstructions[op_idx].type==OT_DIRECTIVE) { error = ApplyDirective((AssemblerDirective)aInstructions[op_idx].index, line, contextStack.curr().source_file); list_flags |= ListLine::KEYWORD; } else if (ConditionalAsm() && aInstructions[op_idx].type == OT_MNEMONIC) { error = AddOpcode(line, aInstructions[op_idx].index, contextStack.curr().source_file); list_flags |= ListLine::MNEMONIC; } line.clear(); } else if (!ConditionalAsm()) { line.clear(); // do nothing if conditional nesting so clear the current line } else if (line.get_first()=='=') { ++line; error = AssignLabel(label, line); line.clear(); list_flags |= ListLine::KEYWORD; } else if (keyword_equ.is_prefix_word(line)) { line += keyword_equ.get_len(); line.skip_whitespace(); error = AssignLabel(label, line); line.clear(); list_flags |= ListLine::KEYWORD; } else { uint32_t nameHash = label.fnv1a(); uint32_t macro = FindLabelIndex(nameHash, macros.getKeys(), macros.count()); bool gotConstruct = false; while (macro < macros.count() && nameHash==macros.getKey(macro)) { if (macros.getValue(macro).name.same_str_case(label)) { error = BuildMacro(macros.getValue(macro), line); gotConstruct = true; line.clear(); // don't process codes from here break; } macro++; } if (!gotConstruct) { uint32_t labPool = FindLabelIndex(nameHash, labelPools.getKeys(), labelPools.count()); gotConstruct = false; while (labPool < labelPools.count() && nameHash==labelPools.getKey(labPool)) { if (labelPools.getValue(labPool).pool_name.same_str_case(label)) { error = AssignPoolLabel(labelPools.getValue(labPool), line); gotConstruct = true; line.clear(); // don't process codes from here break; } labPool++; } if (!gotConstruct) { if (StringSymbol *pStr = GetString(label)) { StringAction(pStr, line); line.clear(); } else if (Merlin() && strref::is_ws(line_start[0])) { error = ERROR_UNDEFINED_CODE; } else if (label[0]=='$') { line.clear(); } else { if (label.get_last()==':') { label.clip(1); } error = AddressLabel(label); line = line_start + int(label.get() + label.get_len() -line_start.get()); if (line[0]==':'||line[0]=='?') { ++line; } // there may be codes after the label list_flags |= ListLine::KEYWORD; } } } } } // Check for unterminated condition in source if (!contextStack.curr().next_source && (!ConditionalAsm() || ConditionalConsumed() || !conditional_depth)) { if (Merlin()) { // this isn't a listed feature, conditional_nesting[0] = 0; // some files just seem to get away without closing conditional_consumed[0] = 0; conditional_depth = 0; } else { PrintError(conditional_source[conditional_depth], ERROR_UNTERMINATED_CONDITION); return ERROR_UNTERMINATED_CONDITION; } } if (line.same_str_case(line_start)) { error = ERROR_UNABLE_TO_PROCESS; } else if (CurrSection().type==ST_ZEROPAGE && CurrSection().address>0x100) { error = ERROR_ZEROPAGE_SECTION_OUT_OF_RANGE; } if (error>STATUS_XREF_DEPENDENT) { PrintError(line_start, error); } // dealt with error, continue with next instruction unless too broken if (errorsize()==curr.pListing->capacity()) { curr.pListing->reserve(curr.pListing->size()+256); } if (((list_flags&(ListLine::KEYWORD|ListLine::CYCLES_START|ListLine::CYCLES_STOP)) || (curr.address != start_address && curr.size())) && !curr.IsDummySection()) { struct ListLine lst; lst.address = start_address - curr.start_address; lst.size = curr.address - start_address; lst.code = contextStack.curr().source_file; lst.source_name = contextStack.curr().source_name; lst.line_offs = int(code_line.get() - lst.code.get()); lst.flags = list_flags; curr.pListing->push_back(lst); } } } return error; } // Build a segment of code (file or macro) StatusCode Asm::BuildSegment() { StatusCode error = STATUS_OK; while (contextStack.curr().read_source) { contextStack.curr().next_source = contextStack.curr().read_source; error = BuildLine(contextStack.curr().next_source.line()); if (error>ERROR_STOP_PROCESSING_ON_HIGHER) { break; } contextStack.curr().read_source = contextStack.curr().next_source; } if (error == STATUS_OK) { error = CheckLateEval(strref(), CurrSection().GetPC()); } return error; } // Produce the assembler listing #define MAX_DEPTH_CYCLE_COUNTER 64 struct cycleCnt { int base; int16_t plus, a16, x16, dp; void clr() { base = 0; plus = a16 = x16 = dp = 0; } void add(uint8_t c) { if (c != 0xff) { base += (c >> 1) & 7; plus += c & 1; if (c & 0xf0) { int i = c >> 4; if (i <= 8) { a16 += timing_65816_plus[i][0]; x16 += timing_65816_plus[i][1]; dp += timing_65816_plus[i][2]; } } } } int plus_acc() { return plus + a16 + x16 + dp; } void combine(const struct cycleCnt &o) { base += o.base; plus += o.plus; a16 += o.a16; x16 += o.x16; dp += o.dp; } bool complex() const { return a16 != 0 || x16 != 0 || dp != 0; } static int get_base(uint8_t c) { return (c & 0xf) >> 1; } static int sum_plus(uint8_t c) { if (c==0xff) { return 0; } int i = c >> 4; if (i) { return i<=8 ? (timing_65816_plus[i][0]+timing_65816_plus[i][1]+timing_65816_plus[i][2]) : 0; } return c & 1; } }; bool Asm::List(strref filename) { FILE *f = stdout; bool opened = false; if (filename) { f = fopen(strown<512>(filename).c_str(), "w"); if (!f) { return false; } opened = true; } // ensure that the greatest instruction set referenced is used for listing if (list_cpu!=cpu) { SetCPU(list_cpu); } // Build a disassembly lookup table uint8_t mnemonic[256]; uint8_t addrmode[256]; memset(mnemonic, 255, sizeof(mnemonic)); memset(addrmode, 255, sizeof(addrmode)); for (int i = 0; i < opcode_count; i++) { for (int j = AMB_COUNT-1; j >= 0; j--) { if (opcode_table[i].modes & (1 << j)) { uint8_t op = opcode_table[i].aCodes[j]; if (addrmode[op]==255) { mnemonic[op] = (uint8_t)i; addrmode[op] = (uint8_t)j; } } } } struct cycleCnt cycles[MAX_DEPTH_CYCLE_COUNTER]; int16_t cycles_depth = 0; memset(cycles, 0, sizeof(cycles)); strref prev_src; int prev_offs = 0; for (std::vector

::iterator si = allSections.begin(); si != allSections.end(); ++si) { if (si->type==ST_REMOVED) { continue; } if (si->address_assigned) fprintf(f, "Section " STRREF_FMT " (%d, %s): $%04x-$%04x\n", STRREF_ARG(si->name), (int)(&*si - &allSections[0]), si->type>=0 && si->typetype] : "???", si->start_address, si->address); else fprintf(f, "Section " STRREF_FMT " (%d, %s) (relocatable)\n", STRREF_ARG(si->name), (int)(&*si - &allSections[0]), str_section_type[si->type]); if (!si->pListing) continue; for (Listing::iterator li = si->pListing->begin(); li != si->pListing->end(); ++li) { strown<256> out; const struct ListLine &lst = *li; if (prev_src.fnv1a() != lst.source_name.fnv1a() || lst.line_offs < prev_offs) { fprintf(f, STRREF_FMT "(%d):\n", STRREF_ARG(lst.source_name), lst.code.count_lines(lst.line_offs)); prev_src = lst.source_name; } else { strref prvline = lst.code.get_substr(prev_offs, lst.line_offs - prev_offs); prvline.next_line(); if (prvline.count_lines() < 5) { while (strref space_line = prvline.line()) { space_line.clip_trailing_whitespace(); strown<128> line_fix(space_line); for (strl_t pos = 0; pos < line_fix.len(); ++pos) { if (line_fix[pos]=='\t') { line_fix.exchange(pos, 1, pos&1 ? strref(" ") : strref(" ")); } } out.pad_to(' ', aCPUs[cpu].timing ? 40 : 33); out.append(line_fix.get_strref()); fprintf(f, STRREF_FMT "\n", STRREF_ARG(out)); out.clear(); } } else { fprintf(f, STRREF_FMT "(%d):\n", STRREF_ARG(lst.source_name), lst.code.count_lines(lst.line_offs)); } } if (lst.size) { out.sprintf_append("$%04x ", lst.address+si->start_address); } int s = lst.wasMnemonic() ? (lst.size < 4 ? lst.size : 4) : (lst.size < 8 ? lst.size : 8); if (si->output && si->output_capacity >= size_t(lst.address + s)) { for (int b = 0; boutput[lst.address+b]); } } if (lst.startClock() && cycles_depth%d", cycles_depth); } if (lst.stopClock()) { out.pad_to(' ', 6); if (cycles[cycles_depth].complex()) { out.sprintf_append("c<%d = %d + m%d + i%d + d%d", cycles_depth, cycles[cycles_depth].base, cycles[cycles_depth].a16, cycles[cycles_depth].x16, cycles[cycles_depth].dp); } else { out.sprintf_append("c<%d = %d + %d", cycles_depth, cycles[cycles_depth].base, cycles[cycles_depth].plus_acc()); } if (cycles_depth) { cycles_depth--; cycles[cycles_depth].combine(cycles[cycles_depth + 1]); } } if (lst.size && lst.wasMnemonic()) { out.pad_to(' ', 18); uint8_t *buf = si->output + lst.address; uint8_t op = mnemonic[*buf]; uint8_t am = addrmode[*buf]; if (op != 255 && am != 255 && am<(sizeof(aAddrModeFmt)/sizeof(aAddrModeFmt[0]))) { const char *fmt = aAddrModeFmt[am]; if (opcode_table[op].modes & AMM_FLIPXY) { if (am == AMB_ZP_X) fmt = "%s $%02x,y"; else if (am == AMB_ABS_X) fmt = "%s $%04x,y"; } if (opcode_table[op].modes & AMM_ZP_ABS) { out.sprintf_append(fmt, opcode_table[op].instr, buf[1], (char)buf[2]+lst.address+si->start_address+3); } else if (opcode_table[op].modes & AMM_BRANCH) { out.sprintf_append(fmt, opcode_table[op].instr, (char)buf[1]+lst.address+si->start_address+2); } else if (opcode_table[op].modes & AMM_BRANCH_L) { out.sprintf_append(fmt, opcode_table[op].instr, (int16_t)(buf[1]|(buf[2]<<8))+lst.address+si->start_address+3); } else if (am==AMB_NON||am==AMB_ACC) { out.sprintf_append(fmt, opcode_table[op].instr); } else if (am==AMB_ABS||am==AMB_ABS_X||am==AMB_ABS_Y||am==AMB_REL||am==AMB_REL_X||am==AMB_REL_L) { out.sprintf_append(fmt, opcode_table[op].instr, buf[1]|(buf[2]<<8)); } else if (am==AMB_ABS_L||am==AMB_ABS_L_X) { out.sprintf_append(fmt, opcode_table[op].instr, buf[1]|(buf[2]<<8)|(buf[3]<<16)); } else if (am==AMB_BLK_MOV) { out.sprintf_append(fmt, opcode_table[op].instr, buf[1], buf[2]); } else if (am==AMB_IMM && lst.size==3) { out.sprintf_append("%s #$%04x", opcode_table[op].instr, buf[1]|(buf[2]<<8)); } else { out.sprintf_append(fmt, opcode_table[op].instr, buf[1]); } if (aCPUs[cpu].timing) { cycles[cycles_depth].add(aCPUs[cpu].timing[*buf]); out.pad_to(' ', 33); if (cycleCnt::sum_plus(aCPUs[cpu].timing[*buf])==1) { out.sprintf_append("%d+", cycleCnt::get_base(aCPUs[cpu].timing[*buf])); } else if (cycleCnt::sum_plus(aCPUs[cpu].timing[*buf])) { out.sprintf_append("%d+%d", cycleCnt::get_base(aCPUs[cpu].timing[*buf]), cycleCnt::sum_plus(aCPUs[cpu].timing[*buf])); } else { out.sprintf_append("%d", cycleCnt::get_base(aCPUs[cpu].timing[*buf])); } } } } out.pad_to(' ', aCPUs[cpu].timing ? 40 : 33); strref line = lst.code.get_skipped(lst.line_offs).get_line(); line.clip_trailing_whitespace(); strown<128> line_fix(line); for (strl_t pos = 0; pos < line_fix.len(); ++pos) { if (line_fix[pos] == '\t') line_fix.exchange(pos, 1, pos & 1 ? strref(" ") : strref(" ")); } out.append(line_fix.get_strref()); fprintf(f, STRREF_FMT "\n", STRREF_ARG(out)); prev_offs = lst.line_offs; } } if (opened) { fclose(f); } return true; } // Create a listing of all valid instructions and addressing modes bool Asm::AllOpcodes(strref filename) { FILE *f = stdout; bool opened = false; if (filename) { f = fopen(strown<512>(filename).c_str(), "w"); if (!f) { return false; } opened = true; } for (int i = 0; i < opcode_count; i++) { uint32_t modes = opcode_table[i].modes; for (int a = 0; a < AMB_COUNT; a++) { if (modes & (1<=FIRST_ERROR) { break; } contextStack.curr().restart(); error = STATUS_OK; } } if (error==STATUS_OK) { if (!obj_target) { LinkZP(); } error = CheckLateEval(); if (error>STATUS_XREF_DEPENDENT) { strown<512> errorText; errorText.copy("Error: "); errorText.append(aStatusStrings[error]); fwrite(errorText.get(), errorText.get_len(), 1, stderr); } else { CheckLateEval(strref(), -1, true); } // output any missing xref's if (!obj_target) { for (std::vector::iterator i = lateEval.begin(); i!=lateEval.end(); ++i) { strown<512> errorText; int line = i->source_file.count_lines(i->expression); errorText.sprintf("Error (%d): ", line+1); errorText.append("Failed to evaluate label \""); errorText.append(i->expression); if (line>=0) { errorText.append("\" : \""); errorText.append(i->source_file.get_line(line).get_trimmed_ws()); } errorText.append("\"\n"); fwrite(errorText.get(), errorText.get_len(), 1, stderr); } } } else { PrintError(&contextStack.curr() ? contextStack.curr().read_source.get_line() : strref(), error); } } // // // OBJECT FILE HANDLING // // struct ObjFileHeader { int16_t id; // 'x6' int16_t sections; int16_t relocs; int16_t labels; int16_t late_evals; int16_t map_symbols; uint32_t stringdata; int bindata; }; struct ObjFileStr { int offs; // offset into string table }; struct ObjFileSection { enum SectionFlags { OFS_DUMMY, OFS_FIXED, OFS_MERGED, }; struct ObjFileStr name; struct ObjFileStr exp_app; int start_address; int end_address; // address size int output_size; // assembled binary size int align_address; int16_t next_group; // next section of group int16_t first_group; // first section of group int16_t relocs; SectionType type; int8_t flags; }; struct ObjFileReloc { int base_value; int section_offset; int16_t target_section; int8_t bytes; int8_t shift; }; struct ObjFileLabel { enum LabelFlags { OFL_EVAL = (1<<15), // Evaluated (may still be relative) OFL_ADDR = (1<<14), // Address or Assign OFL_CNST = (1<<13), // Constant OFL_XDEF = OFL_CNST-1 // External (index into file array) }; struct ObjFileStr name; int value; int flags; // 1<<(LabelFlags) int16_t section; // -1 if resolved, file section # if section rel int16_t mapIndex; // -1 if resolved, index into map if relative }; struct ObjFileLateEval { struct ObjFileStr label; struct ObjFileStr expression; int address; // PC relative to section or fixed int target; // offset into section memory int16_t section; // section to target int16_t rept; // value of rept for this late eval int16_t scope; // PC start of scope int16_t type; // label, byte, branch, word (LateEval::Type) }; struct ObjFileMapSymbol { struct ObjFileStr name; // symbol name int value; int16_t section; bool local; // local labels are probably needed }; // Simple string pool, converts strref strings to zero terminated strings and returns the offset to the string in the pool. static int _AddStrPool(const strref str, pairArray *pLookup, char **strPool, uint32_t &strPoolSize, uint32_t &strPoolCap) { if (!str.get()||!str.get_len()) { return -1; } // empty string uint32_t hash = str.fnv1a(); uint32_t index = FindLabelIndex(hash, pLookup->getKeys(), pLookup->count()); if (indexcount()&&str.same_str_case(*strPool+pLookup->getValue(index))) { return pLookup->getValue(index); } int strOffs = strPoolSize; if ((strOffs + str.get_len() + 1) > strPoolCap) { strPoolCap = strOffs + (uint32_t)str.get_len() + 4096; char *strPoolGrow = (char*)malloc(strPoolCap); if (strPoolGrow) { if (*strPool) { memcpy(strPoolGrow, *strPool, strPoolSize); free(*strPool); } *strPool = strPoolGrow; } else { return -1; } } if (*strPool) { char *dest = *strPool + strPoolSize; memcpy(dest, str.get(), str.get_len()); dest[str.get_len()] = 0; strPoolSize += (uint32_t)str.get_len()+1; pLookup->insert(index, hash); pLookup->getValues()[index] = strOffs; } return strOffs; } StatusCode Asm::WriteObjectFile(strref filename) { if (allSections.size()==0) return ERROR_NOT_A_SECTION; if (FILE *f = fopen(strown<512>(filename).c_str(), "wb")) { struct ObjFileHeader hdr = { 0 }; hdr.id = 0x7836; hdr.sections = (int16_t)allSections.size(); hdr.relocs = 0; hdr.bindata = 0; for (std::vector

::iterator s = allSections.begin(); s!=allSections.end(); ++s) { if (s->type != ST_REMOVED) { if (s->pRelocs) { hdr.relocs += int16_t(s->pRelocs->size()); } hdr.bindata += s->size(); } } hdr.late_evals = (int16_t)lateEval.size(); hdr.map_symbols = (int16_t)map.size(); hdr.stringdata = 0; // labels don't include XREF labels hdr.labels = 0; for (uint32_t l = 0; l::iterator el = externals.begin(); el!=externals.end(); ++el) { hdr.labels += (int16_t)el->labels.count(); } char *stringPool = nullptr; uint32_t stringPoolCap = 0; pairArray stringArray; stringArray.reserve(hdr.labels * 2 + hdr.sections + hdr.late_evals*2); struct ObjFileSection *aSects = hdr.sections ? (struct ObjFileSection*)calloc(hdr.sections, sizeof(struct ObjFileSection)) : nullptr; struct ObjFileReloc *aRelocs = hdr.relocs ? (struct ObjFileReloc*)calloc(hdr.relocs, sizeof(struct ObjFileReloc)) : nullptr; struct ObjFileLabel *aLabels = hdr.labels ? (struct ObjFileLabel*)calloc(hdr.labels, sizeof(struct ObjFileLabel)) : nullptr; struct ObjFileLateEval *aLateEvals = hdr.late_evals ? (struct ObjFileLateEval*)calloc(hdr.late_evals, sizeof(struct ObjFileLateEval)) : nullptr; struct ObjFileMapSymbol *aMapSyms = hdr.map_symbols ? (struct ObjFileMapSymbol*)calloc(hdr.map_symbols, sizeof(struct ObjFileMapSymbol)) : nullptr; int sect = 0, reloc = 0, labs = 0, late = 0, map_sym = 0; memset(aRemapSects, 0xff, sizeof(int16_t) * hdr.sections); // discard the removed sections by making a table of skipped indices for (std::vector

::iterator si = allSections.begin(); si!=allSections.end(); ++si) { if (si->type != ST_REMOVED) aRemapSects[&*si-&allSections[0]] = (int16_t)sect++; } sect = 0; // write out sections and relocs if (hdr.sections) { for (std::vector

::iterator si = allSections.begin(); si!=allSections.end(); ++si) { if (si->type == ST_REMOVED) continue; struct ObjFileSection &s = aSects[sect++]; s.name.offs = _AddStrPool(si->name, &stringArray, &stringPool, hdr.stringdata, stringPoolCap); s.exp_app.offs = _AddStrPool(si->export_append, &stringArray, &stringPool, hdr.stringdata, stringPoolCap); s.output_size = si->size(); s.align_address = si->align_address; s.next_group = si->next_group >= 0 ? aRemapSects[si->next_group] : -1; s.first_group = si->first_group >= 0 ? aRemapSects[si->first_group] : -1; s.relocs = si->pRelocs ? (int16_t)(si->pRelocs->size()) : 0; s.start_address = si->start_address; s.end_address = si->address; s.type = si->type; s.flags = (si->IsDummySection() ? (1 << ObjFileSection::OFS_DUMMY) : 0) | (si->IsMergedSection() ? (1 << ObjFileSection::OFS_MERGED) : 0) | (si->address_assigned ? (1 << ObjFileSection::OFS_FIXED) : 0); if (si->pRelocs && si->pRelocs->size() && aRelocs) { for (relocList::iterator ri = si->pRelocs->begin(); ri!=si->pRelocs->end(); ++ri) { struct ObjFileReloc &r = aRelocs[reloc++]; r.base_value = ri->base_value; r.section_offset = ri->section_offset; r.target_section = ri->target_section >= 0 ? aRemapSects[ri->target_section] : -1; r.bytes = ri->bytes; r.shift = ri->shift; } } } } hdr.sections = (int16_t)sect; // write out labels if (hdr.labels) { for (uint32_t li = 0; li=0 ? aRemapSects[lo.section] : -1; l.mapIndex = (int16_t)lo.mapIndex; l.flags = (lo.constant ? ObjFileLabel::OFL_CNST : 0) | (lo.pc_relative ? ObjFileLabel::OFL_ADDR : 0) | (lo.evaluated ? ObjFileLabel::OFL_EVAL : 0) | (lo.external ? ObjFileLabel::OFL_XDEF : 0); } } } // protected labels included from other object files if (hdr.labels) { int file_index = 1; for (std::vector::iterator el = externals.begin(); el != externals.end(); ++el) { for (uint32_t li = 0; li < el->labels.count(); ++li) { Label &lo = el->labels.getValue(li); struct ObjFileLabel &l = aLabels[labs++]; l.name.offs = _AddStrPool(lo.label_name, &stringArray, &stringPool, hdr.stringdata, stringPoolCap); l.value = lo.value; l.section = lo.section >= 0 ? aRemapSects[lo.section] : -1; l.mapIndex = (int16_t)lo.mapIndex; l.flags = (lo.constant ? ObjFileLabel::OFL_CNST : 0) | (lo.pc_relative ? ObjFileLabel::OFL_ADDR : 0) | (lo.evaluated ? ObjFileLabel::OFL_EVAL : 0) | file_index; } file_index++; } } // write out late evals if (aLateEvals) { for (std::vector::iterator lei = lateEval.begin(); lei != lateEval.end(); ++lei) { struct ObjFileLateEval &le = aLateEvals[late++]; le.label.offs = _AddStrPool(lei->label, &stringArray, &stringPool, hdr.stringdata, stringPoolCap); le.expression.offs = _AddStrPool(lei->expression, &stringArray, &stringPool, hdr.stringdata, stringPoolCap); le.section = lei->section >= 0 ? aRemapSects[lei->section] : -1; le.rept = lei->rept; le.target = (int16_t)lei->target; le.address = lei->address; le.scope = (int16_t)lei->scope; le.type = (int16_t)lei->type; } } // write out map symbols if (aMapSyms) { for (MapSymbolArray::iterator mi = map.begin(); mi != map.end(); ++mi) { struct ObjFileMapSymbol &ms = aMapSyms[map_sym++]; ms.name.offs = _AddStrPool(mi->name, &stringArray, &stringPool, hdr.stringdata, stringPoolCap); ms.value = mi->value; ms.local = mi->local; ms.section = mi->section >= 0 ? aRemapSects[mi->section] : -1; } } // write out the file fwrite(&hdr, sizeof(hdr), 1, f); fwrite(aSects, sizeof(aSects[0]), sect, f); fwrite(aRelocs, sizeof(aRelocs[0]), reloc, f); fwrite(aLabels, sizeof(aLabels[0]), labs, f); fwrite(aLateEvals, sizeof(aLateEvals[0]), late, f); fwrite(aMapSyms, sizeof(aMapSyms[0]), map_sym, f); fwrite(stringPool, hdr.stringdata, 1, f); for (std::vector

::iterator si = allSections.begin(); si!=allSections.end(); ++si) { if (!si->IsDummySection()&&!si->IsMergedSection()&&si->size()!=0&&si->type!=ST_REMOVED) { fwrite(si->output, si->size(), 1, f); } } // done with I/O fclose(f); if (aRemapSects) { free(aRemapSects); } if (stringPool) { free(stringPool); } if (aMapSyms) { free(aMapSyms); } if (aLateEvals) { free(aLateEvals); } if (aLabels) { free(aLabels); } if (aRelocs) { free(aRelocs); } if (aSects) { free(aSects); } stringArray.clear(); } return STATUS_OK; } StatusCode Asm::ReadObjectFile(strref filename, int link_to_section) { size_t size; strown<512> file; file.copy(filename); // Merlin mostly uses extension-less files, append .x65 as a default if ((Merlin() && !file.has_suffix(".x65")) || filename.find('.')<0) file.append(".x65"); int file_index = (int)externals.size(); if (char *data = LoadBinary(file.get_strref(), size)) { struct ObjFileHeader &hdr = *(struct ObjFileHeader*)data; size_t sum = sizeof(hdr) + hdr.sections*sizeof(struct ObjFileSection) + hdr.relocs * sizeof(struct ObjFileReloc) + hdr.labels * sizeof(struct ObjFileLabel) + hdr.late_evals * sizeof(struct ObjFileLateEval) + hdr.map_symbols * sizeof(struct ObjFileMapSymbol) + hdr.stringdata + hdr.bindata; if (hdr.id == 0x7836 && sum == size) { struct ObjFileSection *aSect = (struct ObjFileSection*)(&hdr + 1); struct ObjFileReloc *aReloc = (struct ObjFileReloc*)(aSect + hdr.sections); struct ObjFileLabel *aLabels = (struct ObjFileLabel*)(aReloc + hdr.relocs); struct ObjFileLateEval *aLateEval = (struct ObjFileLateEval*)(aLabels + hdr.labels); struct ObjFileMapSymbol *aMapSyms = (struct ObjFileMapSymbol*)(aLateEval + hdr.late_evals); const char *str_orig = (const char*)(aMapSyms + hdr.map_symbols); const char *bin_data = str_orig + hdr.stringdata; char *str_pool = (char*)malloc(hdr.stringdata); memcpy(str_pool, str_orig, hdr.stringdata); loadedData.push_back(str_pool); int prevSection = SectionId(); int16_t *aSctRmp = (int16_t*)malloc(hdr.sections * sizeof(int16_t)); int last_linked_section = link_to_section; while (last_linked_section>=0&&allSections[last_linked_section].next_group>=0) { last_linked_section = allSections[last_linked_section].next_group; } // sections for (int si = 0; si < hdr.sections; si++) { int16_t f = aSect[si].flags; if (f & (1 << ObjFileSection::OFS_MERGED)) continue; if (f & (1 << ObjFileSection::OFS_DUMMY)) { if (f&(1 << ObjFileSection::OFS_FIXED)) { DummySection(aSect[si].start_address); CurrSection().AddBin(nullptr, aSect[si].end_address - aSect[si].start_address); } else { DummySection(); CurrSection().AddBin(nullptr, aSect[si].end_address - aSect[si].start_address); } } else { if (f&(1<=0 ? strref(str_pool+aSect[si].name.offs) : strref(), aSect[si].start_address); } else { SetSection(aSect[si].name.offs>=0 ? strref(str_pool+aSect[si].name.offs) : strref()); } Section &s = CurrSection(); s.include_from = filename; s.export_append = aSect[si].exp_app.offs>=0 ? strref(str_pool + aSect[si].name.offs) : strref(); s.align_address = aSect[si].align_address; s.address = aSect[si].end_address; s.type = aSect[si].type; if (aSect[si].output_size) { s.output = (uint8_t*)malloc(aSect[si].output_size); memcpy(s.output, bin_data, aSect[si].output_size); s.curr = s.output + aSect[si].output_size; s.output_capacity = aSect[si].output_size; bin_data += aSect[si].output_size; } if (last_linked_section>=0) { allSections[last_linked_section].next_group = SectionId(); s.first_group = allSections[last_linked_section].first_group >=0 ? allSections[last_linked_section].first_group : last_linked_section; last_linked_section = SectionId(); } } aSctRmp[si] = (int16_t)allSections.size()-1; } // fix up groups and relocs int curr_reloc = 0; for (int si = 0; si < hdr.sections; si++) { Section &s = allSections[aSctRmp[si]]; if (aSect[si].first_group >= 0) s.first_group = aSctRmp[aSect[si].first_group]; if (aSect[si].next_group >= 0) s.first_group = aSctRmp[aSect[si].next_group]; for (int ri = 0; ri < aSect[si].relocs; ri++) { int r = ri + curr_reloc; struct ObjFileReloc &rs = aReloc[r]; allSections[aSctRmp[si]].AddReloc(rs.base_value, rs.section_offset, aSctRmp[rs.target_section], rs.bytes, rs.shift); } curr_reloc += aSect[si].relocs; } for (int mi = 0; mi < hdr.map_symbols; mi++) { struct ObjFileMapSymbol &m = aMapSyms[mi]; if (map.size()==map.capacity()) { map.reserve(map.size()+256); } MapSymbol sym; sym.name = m.name.offs>=0 ? strref(str_pool + m.name.offs) : strref(); sym.section = m.section >=0 ? aSctRmp[m.section] : m.section; sym.value = m.value; sym.local = m.local; map.push_back(sym); } for (int li = 0; li < hdr.labels; li++) { struct ObjFileLabel &l = aLabels[li]; strref name = l.name.offs >= 0 ? strref(str_pool + l.name.offs) : strref(); Label *lbl = GetLabel(name); int16_t f = (int16_t)l.flags; int external = f & ObjFileLabel::OFL_XDEF; if (external == ObjFileLabel::OFL_XDEF) { if (!lbl) { lbl = AddLabel(name.fnv1a()); } // insert shared label else if (!lbl->reference) { continue; } } else { // insert protected label while ((file_index + external) >= (int)externals.size()) { if (externals.size()==externals.capacity()) { externals.reserve(externals.size()+32); } externals.push_back(ExtLabels()); } uint32_t hash = name.fnv1a(); uint32_t index = FindLabelIndex(hash, externals[file_index].labels.getKeys(), externals[file_index].labels.count()); externals[file_index].labels.insert(index, hash); lbl = externals[file_index].labels.getValues() + index; } lbl->label_name = name; lbl->pool_name.clear(); lbl->value = l.value; lbl->section = l.section >= 0 ? aSctRmp[l.section] : l.section; lbl->mapIndex = l.mapIndex >= 0 ? (l.mapIndex + (int)map.size()) : -1; lbl->evaluated = !!(f & ObjFileLabel::OFL_EVAL); lbl->pc_relative = !!(f & ObjFileLabel::OFL_ADDR); lbl->constant = !!(f & ObjFileLabel::OFL_CNST); lbl->external = external == ObjFileLabel::OFL_XDEF; lbl->reference = false; } // no protected labels => don't track as separate file if (file_index==(int)externals.size()) { file_index = -1; } for (int li = 0; li < hdr.late_evals; ++li) { struct ObjFileLateEval &le = aLateEval[li]; strref name = le.label.offs >= 0 ? strref(str_pool + le.label.offs) : strref(); Label *pLabel = GetLabel(name); if (pLabel) { if (pLabel->evaluated) { AddLateEval(name, le.address, le.scope, strref(str_pool + le.expression.offs), (LateEval::Type)le.type); LateEval &last = lateEval[lateEval.size()-1]; last.section = le.section >= 0 ? aSctRmp[le.section] : le.section; last.rept = le.rept; last.source_file = strref(); last.file_ref = file_index; } } else { AddLateEval(le.target, le.address, le.scope, strref(str_pool + le.expression.offs), strref(), (LateEval::Type)le.type); LateEval &last = lateEval[lateEval.size()-1]; last.section = le.section >= 0 ? aSctRmp[le.section] : le.section; last.rept = le.rept; last.file_ref = file_index; } } free(aSctRmp); // restore previous section current_section = &allSections[prevSection]; } else { return ERROR_NOT_AN_X65_OBJECT_FILE; } } return STATUS_OK; } // number of section types that can be merged enum OMFRecCode { OMFR_END = 0, OMFR_RELOC = 0xe2, // bytes.b, bitshift.b, offset.l, value.l OMFR_INTERSEG = 0xe3, // bytes.b, bitshift.b, offset.l, filenum.w, segnum.w, offsref.l OMFR_LCONST = 0xf2, // bytes.b, b,b,b, data.b[bytes] OMFR_cRELOC = 0xf5, // bytes.b, bitshift.b, offset.w, value.w OMFR_cINTERSEG = 0xf6, // bytes.b, bitshift.b, offset.w, segnum.b, offsref.w OMFR_SUPER = 0xf7, }; struct OMFSegHdr { uint8_t SegTotal[4]; // + Segment Segment Header size Body size uint8_t ResSpc[4]; // Number of 0x00 to add to the end of Body uint8_t Length[4]; // Memory Size Segment uint8_t pad1[1]; uint8_t LabLen[1]; // Length Names: 10 uint8_t NumLen[1]; // Size = 4 numbers uint8s uint8_t Version[1]; // OMF Version: 2 uint8_t BankSize[4]; // Size of a Bank: 64 KB code if, between 0 and 64 KB for Data uint8_t Kind[2]; // Type Segment uint8_t pad2[2]; uint8_t Org[4]; uint8_t Align[4]; // Alignment: 0, 64 or 256 KB uint8_t NumSEx[1]; // Little Endian: 0 for IIgs uint8_t pad3[1]; uint8_t SegNum[2]; // Segment Number: 1-> N uint8_t EntryPointOffset[4]; // Entry point in the Segment uint8_t DispNameOffset[2]; // Where the offset is located LoadName uint8_t DispDataOffset[2]; // Offset begins the Body Segment uint8_t tempOrg[4]; // }; // write a number of bytes of a value static void _writeNBytes(uint8_t *dest, int bytes, int value) { while (bytes--) { *dest++ = (uint8_t)value; value >>= 8; } } // sort relocs before writing GS OS reloc instructions static int sortRelocByOffs(const void *A, const void *B) { return ((const Reloc*)A)->section_offset - ((const Reloc*)B)->section_offset; } // Export an Apple II GS relocatable executable StatusCode Asm::WriteA2GS_OMF(strref filename, bool full_collapse) { // determine the section with startup code - either first loaded object file or current file int first_section = 0; for (int s = 1; s<(int)allSections.size(); s++) { if (allSections[s].type==ST_CODE && (allSections[first_section].type != ST_CODE || (!allSections[s].include_from && allSections[first_section].include_from))) first_section = s; } // collapse all section together that share the same name StatusCode status = MergeSectionsByName(first_section); if (status!=STATUS_OK) { return status; } // Zero page section for x65 implies addresses, OMF direct-page/stack seg implies size of direct page + stack // so resolve the zero page sections first status = LinkZP(); if (status!=STATUS_OK) { return status; } // full collapse means that all sections gets merged into one // code+data section and one bss section which will be appended if (full_collapse) { status = MergeAllSections(first_section); if (status!=STATUS_OK) { return status; } } // determine if there is a direct page stack int DP_Stack_Size = 0; // 0 => default size (don't include) for (std::vector

::iterator s = allSections.begin(); s != allSections.end(); ++s) { if (s->type==ST_ZEROPAGE) { s->type = ST_REMOVED; } if (s->type == ST_BSS && s->name.same_str("directpage_stack")) { DP_Stack_Size += s->addr_size(); s->type = ST_REMOVED; } } std::vector SegNum; // order of valid segments std::vector SegLookup; // inverse of SegNum SegNum.reserve(allSections.size()); SegLookup.reserve(allSections.size()); int reloc_max = 1; // OMF super instructions work by incremental addresses, sort relocs to simplify output for (std::vector

::iterator s = allSections.begin(); s != allSections.end(); ++s) { if (first_section==SectionId(*s)) { SegNum.insert(SegNum.begin(), SectionId(*s)); } else if (s->type!=ST_REMOVED) { SegNum.push_back(SectionId(*s)); } SegLookup.push_back(-1); if ((s->type == ST_CODE || s->type == ST_DATA) && s->pRelocs && s->pRelocs->size() > 1) { qsort(&(*s->pRelocs)[0], s->pRelocs->size(), sizeof(Reloc), sortRelocByOffs); if ((int)s->pRelocs->size()>reloc_max) { reloc_max = (int)s->pRelocs->size(); } } } // reloc_max needs to greater than zero if (reloc_max<1) { return ERROR_ABORTED; } for (std::vector::iterator i = SegNum.begin(); i!=SegNum.end(); ++i) { SegLookup[*i] = (int)(&*i-&SegNum[0]); } uint8_t *instructions = (uint8_t*)malloc(reloc_max * 16); if (!instructions) { return ERROR_OUT_OF_MEMORY; } // open a file for writing FILE *f = fopen(strown<512>(filename).c_str(), "wb"); if (!f) { free(instructions); return ERROR_CANT_WRITE_TO_FILE; } // consume all the relocs struct OMFSegHdr hdr = { 0 }; // initialize segment header hdr.NumLen[0] = 4; // numbers are 4 bytes under GS OS hdr.Version[0] = 2; // version is 2 for GS OS hdr.BankSize[2] = 1; // 64k banks _writeNBytes(hdr.DispNameOffset, 2, sizeof(hdr)); // start of file name (10 chars) strref fileBase = export_base_name; char segfile[10]; memset(segfile, ' ', 10); memcpy(segfile, fileBase.get(), fileBase.get_len() > 10 ? 10 : fileBase.get_len()); for (std::vector::iterator i = SegNum.begin(); i != SegNum.end(); ++i) { Section &s = allSections[*i]; strref segName = s.name ? s.name : (s.type == ST_CODE ? strref("CODE") : strref("DATA")); // support zero bytes at end of block int num_zeroes_at_end = s.addr_size() - s.size(); int num_bytes_file = s.size(); while (num_bytes_file && s.output[num_bytes_file - 1] == 0) { num_zeroes_at_end++; num_bytes_file--; } _writeNBytes(hdr.SegNum, 2, SegLookup[*i] + 1); _writeNBytes(hdr.Kind, 2, s.type == ST_CODE ? 0x1000 : (s.type == ST_ZEROPAGE ? 0x12 : 0x1001)); _writeNBytes(hdr.DispDataOffset, 2, sizeof(hdr) + 10 + 1 + (int)segName.get_len()); _writeNBytes(hdr.Length, 4, num_bytes_file + num_zeroes_at_end); _writeNBytes(hdr.ResSpc, 4, num_zeroes_at_end); _writeNBytes(hdr.Align, 4, s.align_address > 1 ? 256 : 0); // instruction list starts with a LCONST + Length(4) + binary, the relocs begin after that int instruction_offs = 0; instructions[instruction_offs++] = OMFR_LCONST; _writeNBytes(instructions+instruction_offs, 4, num_bytes_file); instruction_offs += 4; if (s.pRelocs && s.pRelocs->size()) { // insert all SUPER_RELOC2 / SUPER_RELOC3 for (int b = 0; b <= 1; b++) { int count_offs = -1; int prev_page = 0; int inst_curr = instruction_offs; instructions[inst_curr++] = OMFR_SUPER; int len_offs = inst_curr; inst_curr += 4; instructions[inst_curr++] = (uint8_t)b; // SUPER_RELOC2 / SUPER_RELOC3 // try all SUPER_RELOC2 (2 bytes self reference, no shift) relocList::iterator r = s.pRelocs->begin(); while (r != s.pRelocs->end()) { if (r->shift == 0 && r->bytes == (b+2) && r->target_section == SectionId(s)) { if ((r->section_offset >> 8) != prev_page) { instructions[inst_curr++] = uint8_t(0x80 | ((r->section_offset >> 8) - prev_page - 1)); count_offs = -1; } // update patch counter for current page or add a new counter if (count_offs < 0) { count_offs = inst_curr; instructions[inst_curr++] = 0; } else instructions[count_offs]++; prev_page = r->section_offset>>8; instructions[inst_curr++] = (uint8_t)r->section_offset; // write patch offset into binary _writeNBytes(s.output + r->section_offset, b + 2, r->base_value); // patch binary with base value r = s.pRelocs->erase(r); } else ++r; } if (inst_curr > (instruction_offs + 6)) { _writeNBytes(instructions + len_offs, 4, inst_curr - instruction_offs - 5); instruction_offs = inst_curr; } } // insert all other records as they are encountered relocList::iterator r = s.pRelocs->begin(); while (r != s.pRelocs->end()) { if (r->target_section == SectionId(s)) { // this is a reloc, check if cRELOC is ok or if need RELOC bool cRELOC = r->section_offset < 0x10000 && r->base_value < 0x10000; instructions[instruction_offs++] = uint8_t(cRELOC ? OMFR_cRELOC : OMFR_RELOC); instructions[instruction_offs++] = r->bytes; instructions[instruction_offs++] = r->shift; _writeNBytes(instructions + instruction_offs, cRELOC ? 2 : 4, r->section_offset); instruction_offs += cRELOC ? 2 : 4; _writeNBytes(instructions + instruction_offs, cRELOC ? 2 : 4, r->base_value); instruction_offs += cRELOC ? 2 : 4; } else { // this is an interseg bool cINTERSEG = r->section_offset < 0x10000 && r->base_value < 0x10000; instructions[instruction_offs++] = uint8_t(cINTERSEG ? OMFR_cINTERSEG : OMFR_INTERSEG); instructions[instruction_offs++] = r->bytes; instructions[instruction_offs++] = r->shift; _writeNBytes(instructions + instruction_offs, cINTERSEG ? 2 : 4, r->section_offset); instruction_offs += cINTERSEG ? 2 : 4; _writeNBytes(instructions + instruction_offs, cINTERSEG ? 0: 2 , 1); // file number = 1 instruction_offs += cINTERSEG ? 0 : 2; _writeNBytes(instructions + instruction_offs, cINTERSEG ? 1 : 2, SegLookup[r->target_section] + 1); // segment number starting from 1 instruction_offs += cINTERSEG ? 1 : 2; _writeNBytes(instructions + instruction_offs, cINTERSEG ? 2 : 4, r->base_value); instruction_offs += cINTERSEG ? 2 : 4; } r = s.pRelocs->erase(r); } } instructions[instruction_offs++] = OMFR_END; // size of seg = file header + 10 bytes file name + 1 byte seg name length + seg nameh + seg.addr_size() + instruction_size int segSize = sizeof(hdr) + 10 + 1 + (int)segName.get_len() + num_bytes_file + instruction_offs; if (num_bytes_file==0) { segSize -= 5; } _writeNBytes(hdr.SegTotal, 4, segSize); uint8_t lenSegName = (uint8_t)segName.get_len(); fwrite(&hdr, sizeof(hdr), 1, f); fwrite(segfile, 10, 1, f); fwrite(&lenSegName, 1, 1, f); fwrite(segName.get(), segName.get_len(), 1, f); if (num_bytes_file) { fwrite(instructions, 5, 1, f); // $f2 + 4 bytes data size fwrite(s.output, num_bytes_file, 1, f); // segment data } if (instruction_offs > 5) fwrite(instructions + 5, instruction_offs - 5, 1, f); // reloc instructions } // if there is a size of the direct page & stack, write it if (DP_Stack_Size) { strref segName("DPStack"); char lenSegName = (char)segName.get_len(); _writeNBytes(hdr.SegNum, 2, (int)SegNum.size()+1); _writeNBytes(hdr.Kind, 2, 0x12); _writeNBytes(hdr.DispDataOffset, 2, sizeof(hdr) + 10 + 1 + (int)segName.get_len()); _writeNBytes(hdr.Length, 4, DP_Stack_Size); _writeNBytes(hdr.ResSpc, 4, DP_Stack_Size); _writeNBytes(hdr.Align, 4, 256); int segSize = sizeof(hdr) + 10 + 1 + (int)segName.get_len() + 1; _writeNBytes(hdr.SegTotal, 4, segSize); instructions[0] = 0; fwrite(&hdr, sizeof(hdr), 1, f); fwrite(segfile, 10, 1, f); fwrite(&lenSegName, 1, 1, f); fwrite(segName.get(), segName.get_len(), 1, f); fwrite(instructions, 1, 1, f); // end instruction } free(instructions); fclose(f); return STATUS_OK; } int main(int argc, char **argv) { const strref listing("lst"); const strref allinstr("opcodes"); const strref endmacro("endm"); const strref cpu("cpu"); const strref acc("acc"); const strref xy("xy"); const strref org("org"); int return_value = 0; bool load_header = true; bool size_header = false; bool info = false; bool gen_allinstr = false; bool gs_os_reloc = false; bool force_merge_sections = false; Asm assembler; const char *source_filename = nullptr, *obj_out_file = nullptr; const char *binary_out_name = nullptr; const char *sym_file = nullptr, *vs_file = nullptr; strref list_file, allinstr_file; for (int a = 1; a1) { assembler.default_org = (int)(arg+1).ahextoui(); } else if (arg.is_number()) { assembler.default_org = (int)arg.atoi(); } // force the current section to be org'd assembler.AssignAddressToSection(assembler.SectionId(), assembler.default_org); } else if (arg.has_prefix(acc)&&arg[acc.get_len()]=='=') { assembler.accumulator_16bit = arg.after('=').atoi()==16; } else if (arg.has_prefix(xy)&&arg[xy.get_len()]=='=') { assembler.index_reg_16bit = arg.after('=').atoi()==16; } else if (arg.has_prefix(cpu)&&(arg.get_len()==cpu.get_len()||arg[cpu.get_len()]=='=')) { arg.split_token_trim('='); bool found = false; for (int c = 0; c FIRST_ERROR) { assembler.PrintError(strref(), err); return_value = 1; } int numExportFiles = assembler.GetExportNames(aAppendNames, MAX_EXPORT_FILES); for (int e = 0; e < numExportFiles; e++) { strown<512> file(binout); file.append(aAppendNames[e]); file.append('.'); file.append(ext); int size_export; int addr; if (uint8_t *buf = assembler.BuildExport(aAppendNames[e], size_export, addr)) { if (FILE *f = fopen(file.c_str(), "wb")) { if (load_header) { uint8_t load_addr[2] = { (uint8_t)addr, (uint8_t)(addr >> 8) }; fwrite(load_addr, 2, 1, f); } if (size_header) { uint8_t byte_size[2] = { (uint8_t)size_export, (uint8_t)(size_export >> 8) }; fwrite(byte_size, 2, 1, f); } fwrite(buf, size_export, 1, f); fclose(f); } free(buf); } } } } // print encountered sections info if (info) { printf("SECTIONS SUMMARY\n================\n"); for (size_t i = 0; i < assembler.allSections.size(); ++i) { Section &s = assembler.allSections[i]; if (s.address > s.start_address) { printf("Section %d: \"" STRREF_FMT "\" Dummy: %s Relative: %s Merged: %s Start: 0x%04x End: 0x%04x\n", (int)i, STRREF_ARG(s.name), s.dummySection ? "yes" : "no", s.IsRelativeSection() ? "yes" : "no", s.IsMergedSection() ? "yes" : "no", s.start_address, s.address); if (s.pRelocs) { for (relocList::iterator rel = s.pRelocs->begin(); rel != s.pRelocs->end(); ++rel) printf("\tReloc value $%x at offs $%x section %d\n", rel->base_value, rel->section_offset, rel->target_section); } } } } // listing after export since addresses are now resolved if (assembler.list_assembly) assembler.List(list_file); // export .sym file if (sym_file && !srcname.same_str(sym_file) && !assembler.map.empty()) { if (FILE *f = fopen(sym_file, "w")) { bool wasLocal = false; for (MapSymbolArray::iterator i = assembler.map.begin(); i!=assembler.map.end(); ++i) { uint32_t value = (uint32_t)i->value; int section = i->section; while (section >= 0 && section < (int)assembler.allSections.size()) { if (assembler.allSections[section].IsMergedSection()) { value += assembler.allSections[section].merged_offset; section = assembler.allSections[section].merged_section; } else { value += assembler.allSections[section].start_address; break; } } fprintf(f, "%s.label " STRREF_FMT " = $%04x", wasLocal==i->local ? "\n" : (i->local ? " {\n" : "\n}\n"), STRREF_ARG(i->name), value); wasLocal = i->local; } fputs(wasLocal ? "\n}\n" : "\n", f); fclose(f); } } // export vice monitor commands if (vs_file && !srcname.same_str(vs_file) && !assembler.map.empty()) { if (FILE *f = fopen(vs_file, "w")) { for (MapSymbolArray::iterator i = assembler.map.begin(); i!=assembler.map.end(); ++i) { uint32_t value = (uint32_t)i->value; int section = i->section; while (section >= 0 && section < (int)assembler.allSections.size()) { if (assembler.allSections[section].IsMergedSection()) { value += assembler.allSections[section].merged_offset; section = assembler.allSections[section].merged_section; } else { value += assembler.allSections[section].start_address; break; } } if(i->name.same_str("debugbreak")) { fprintf(f, "break $%04x\n", value); } else { fprintf(f, "al $%04x %s" STRREF_FMT "\n", value, i->name[0]=='.' ? "" : ".", STRREF_ARG(i->name)); } } fclose(f); } } } // free some memory assembler.Cleanup(); } } return return_value; }