mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-10-30 16:17:05 +00:00 
			
		
		
		
	The fixes are to note that AArch64 has additional restrictions on when local relocations can be used. In particular, ld64 requires that relocations to cstring/cfstrings use linker visible symbols. Original message: In an assembly expression like bar: .long L0 + 1 the intended semantics is that bar will contain a pointer one byte past L0. In sections that are merged by content (strings, 4 byte constants, etc), a single position in the section doesn't give the linker enough information. For example, it would not be able to tell a relocation must point to the end of a string, since that would look just like the start of the next. The solution used in ELF is to use relocations with symbols if there is a non-zero addend. In MachO before this patch we would just keep all symbols in some sections. This would miss some cases (only cstrings on x86_64 were implemented) and was inefficient since most relocations have an addend of 0 and can be represented without the symbol. This patch implements the non-zero addend logic for MachO too. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@226503 91177308-0d34-0410-b5e6-96231b3b80d8
		
			
				
	
	
		
			289 lines
		
	
	
		
			9.7 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			289 lines
		
	
	
		
			9.7 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| //===-- llvm/MC/MCMachObjectWriter.h - Mach Object Writer -------*- C++ -*-===//
 | |
| //
 | |
| //                     The LLVM Compiler Infrastructure
 | |
| //
 | |
| // This file is distributed under the University of Illinois Open Source
 | |
| // License. See LICENSE.TXT for details.
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| 
 | |
| #ifndef LLVM_MC_MCMACHOBJECTWRITER_H
 | |
| #define LLVM_MC_MCMACHOBJECTWRITER_H
 | |
| 
 | |
| #include "llvm/ADT/DenseMap.h"
 | |
| #include "llvm/ADT/SmallString.h"
 | |
| #include "llvm/MC/MCExpr.h"
 | |
| #include "llvm/MC/MCObjectWriter.h"
 | |
| #include "llvm/MC/StringTableBuilder.h"
 | |
| #include "llvm/Support/DataTypes.h"
 | |
| #include "llvm/Support/MachO.h"
 | |
| #include <vector>
 | |
| 
 | |
| namespace llvm {
 | |
| 
 | |
| class MCSectionData;
 | |
| class MachObjectWriter;
 | |
| 
 | |
| class MCMachObjectTargetWriter {
 | |
|   const unsigned Is64Bit : 1;
 | |
|   const uint32_t CPUType;
 | |
|   const uint32_t CPUSubtype;
 | |
|   // FIXME: Remove this, we should just always use it once we no longer care
 | |
|   // about Darwin 'as' compatibility.
 | |
|   const unsigned UseAggressiveSymbolFolding : 1;
 | |
|   unsigned LocalDifference_RIT;
 | |
| 
 | |
| protected:
 | |
|   MCMachObjectTargetWriter(bool Is64Bit_, uint32_t CPUType_,
 | |
|                            uint32_t CPUSubtype_,
 | |
|                            bool UseAggressiveSymbolFolding_ = false);
 | |
| 
 | |
|   void setLocalDifferenceRelocationType(unsigned Type) {
 | |
|     LocalDifference_RIT = Type;
 | |
|   }
 | |
| 
 | |
| public:
 | |
|   virtual ~MCMachObjectTargetWriter();
 | |
| 
 | |
|   /// @name Lifetime Management
 | |
|   /// @{
 | |
| 
 | |
|   virtual void reset() {};
 | |
| 
 | |
|   /// @}
 | |
| 
 | |
|   /// @name Accessors
 | |
|   /// @{
 | |
| 
 | |
|   bool is64Bit() const { return Is64Bit; }
 | |
|   bool useAggressiveSymbolFolding() const { return UseAggressiveSymbolFolding; }
 | |
|   uint32_t getCPUType() const { return CPUType; }
 | |
|   uint32_t getCPUSubtype() const { return CPUSubtype; }
 | |
|   unsigned getLocalDifferenceRelocationType() const {
 | |
|     return LocalDifference_RIT;
 | |
|   }
 | |
| 
 | |
|   /// @}
 | |
| 
 | |
|   /// @name API
 | |
|   /// @{
 | |
| 
 | |
|   virtual void RecordRelocation(MachObjectWriter *Writer, MCAssembler &Asm,
 | |
|                                 const MCAsmLayout &Layout,
 | |
|                                 const MCFragment *Fragment,
 | |
|                                 const MCFixup &Fixup, MCValue Target,
 | |
|                                 uint64_t &FixedValue) = 0;
 | |
| 
 | |
|   /// @}
 | |
| };
 | |
| 
 | |
| class MachObjectWriter : public MCObjectWriter {
 | |
|   /// MachSymbolData - Helper struct for containing some precomputed information
 | |
|   /// on symbols.
 | |
|   struct MachSymbolData {
 | |
|     MCSymbolData *SymbolData;
 | |
|     uint64_t StringIndex;
 | |
|     uint8_t SectionIndex;
 | |
| 
 | |
|     // Support lexicographic sorting.
 | |
|     bool operator<(const MachSymbolData &RHS) const;
 | |
|   };
 | |
| 
 | |
|   /// The target specific Mach-O writer instance.
 | |
|   std::unique_ptr<MCMachObjectTargetWriter> TargetObjectWriter;
 | |
| 
 | |
|   /// @name Relocation Data
 | |
|   /// @{
 | |
| 
 | |
|   struct RelAndSymbol {
 | |
|     const MCSymbolData *Sym;
 | |
|     MachO::any_relocation_info MRE;
 | |
|     RelAndSymbol(const MCSymbolData *Sym, const MachO::any_relocation_info &MRE)
 | |
|         : Sym(Sym), MRE(MRE) {}
 | |
|   };
 | |
| 
 | |
|   llvm::DenseMap<const MCSectionData *, std::vector<RelAndSymbol>> Relocations;
 | |
|   llvm::DenseMap<const MCSectionData*, unsigned> IndirectSymBase;
 | |
| 
 | |
|   /// @}
 | |
|   /// @name Symbol Table Data
 | |
|   /// @{
 | |
| 
 | |
|   StringTableBuilder StringTable;
 | |
|   std::vector<MachSymbolData> LocalSymbolData;
 | |
|   std::vector<MachSymbolData> ExternalSymbolData;
 | |
|   std::vector<MachSymbolData> UndefinedSymbolData;
 | |
| 
 | |
|   /// @}
 | |
| 
 | |
|   MachSymbolData *findSymbolData(const MCSymbol &Sym);
 | |
| 
 | |
| public:
 | |
|   MachObjectWriter(MCMachObjectTargetWriter *MOTW, raw_ostream &_OS,
 | |
|                    bool _IsLittleEndian)
 | |
|     : MCObjectWriter(_OS, _IsLittleEndian), TargetObjectWriter(MOTW) {
 | |
|   }
 | |
| 
 | |
|   /// @name Lifetime management Methods
 | |
|   /// @{
 | |
| 
 | |
|   void reset() override;
 | |
| 
 | |
|   /// @}
 | |
| 
 | |
|   /// @name Utility Methods
 | |
|   /// @{
 | |
| 
 | |
|   bool isFixupKindPCRel(const MCAssembler &Asm, unsigned Kind);
 | |
| 
 | |
|   SectionAddrMap SectionAddress;
 | |
| 
 | |
|   SectionAddrMap &getSectionAddressMap() { return SectionAddress; }
 | |
| 
 | |
|   uint64_t getSectionAddress(const MCSectionData* SD) const {
 | |
|     return SectionAddress.lookup(SD);
 | |
|   }
 | |
|   uint64_t getSymbolAddress(const MCSymbolData* SD,
 | |
|                             const MCAsmLayout &Layout) const;
 | |
| 
 | |
|   uint64_t getFragmentAddress(const MCFragment *Fragment,
 | |
|                               const MCAsmLayout &Layout) const;
 | |
| 
 | |
|   uint64_t getPaddingSize(const MCSectionData *SD,
 | |
|                           const MCAsmLayout &Layout) const;
 | |
| 
 | |
|   bool doesSymbolRequireExternRelocation(const MCSymbolData *SD);
 | |
| 
 | |
|   /// @}
 | |
| 
 | |
|   /// @name Target Writer Proxy Accessors
 | |
|   /// @{
 | |
| 
 | |
|   bool is64Bit() const { return TargetObjectWriter->is64Bit(); }
 | |
|   bool isX86_64() const {
 | |
|     uint32_t CPUType = TargetObjectWriter->getCPUType();
 | |
|     return CPUType == MachO::CPU_TYPE_X86_64;
 | |
|   }
 | |
| 
 | |
|   /// @}
 | |
| 
 | |
|   void WriteHeader(unsigned NumLoadCommands, unsigned LoadCommandsSize,
 | |
|                    bool SubsectionsViaSymbols);
 | |
| 
 | |
|   /// WriteSegmentLoadCommand - Write a segment load command.
 | |
|   ///
 | |
|   /// \param NumSections The number of sections in this segment.
 | |
|   /// \param SectionDataSize The total size of the sections.
 | |
|   void WriteSegmentLoadCommand(unsigned NumSections,
 | |
|                                uint64_t VMSize,
 | |
|                                uint64_t SectionDataStartOffset,
 | |
|                                uint64_t SectionDataSize);
 | |
| 
 | |
|   void WriteSection(const MCAssembler &Asm, const MCAsmLayout &Layout,
 | |
|                     const MCSectionData &SD, uint64_t FileOffset,
 | |
|                     uint64_t RelocationsStart, unsigned NumRelocations);
 | |
| 
 | |
|   void WriteSymtabLoadCommand(uint32_t SymbolOffset, uint32_t NumSymbols,
 | |
|                               uint32_t StringTableOffset,
 | |
|                               uint32_t StringTableSize);
 | |
| 
 | |
|   void WriteDysymtabLoadCommand(uint32_t FirstLocalSymbol,
 | |
|                                 uint32_t NumLocalSymbols,
 | |
|                                 uint32_t FirstExternalSymbol,
 | |
|                                 uint32_t NumExternalSymbols,
 | |
|                                 uint32_t FirstUndefinedSymbol,
 | |
|                                 uint32_t NumUndefinedSymbols,
 | |
|                                 uint32_t IndirectSymbolOffset,
 | |
|                                 uint32_t NumIndirectSymbols);
 | |
| 
 | |
|   void WriteNlist(MachSymbolData &MSD, const MCAsmLayout &Layout);
 | |
| 
 | |
|   void WriteLinkeditLoadCommand(uint32_t Type, uint32_t DataOffset,
 | |
|                                 uint32_t DataSize);
 | |
| 
 | |
|   void WriteLinkerOptionsLoadCommand(const std::vector<std::string> &Options);
 | |
| 
 | |
|   // FIXME: We really need to improve the relocation validation. Basically, we
 | |
|   // want to implement a separate computation which evaluates the relocation
 | |
|   // entry as the linker would, and verifies that the resultant fixup value is
 | |
|   // exactly what the encoder wanted. This will catch several classes of
 | |
|   // problems:
 | |
|   //
 | |
|   //  - Relocation entry bugs, the two algorithms are unlikely to have the same
 | |
|   //    exact bug.
 | |
|   //
 | |
|   //  - Relaxation issues, where we forget to relax something.
 | |
|   //
 | |
|   //  - Input errors, where something cannot be correctly encoded. 'as' allows
 | |
|   //    these through in many cases.
 | |
| 
 | |
|   // Add a relocation to be output in the object file. At the time this is
 | |
|   // called, the symbol indexes are not know, so if the relocation refers
 | |
|   // to a symbol it should be passed as \p RelSymbol so that it can be updated
 | |
|   // afterwards. If the relocation doesn't refer to a symbol, nullptr should be
 | |
|   // used.
 | |
|   void addRelocation(const MCSymbolData *RelSymbol, const MCSectionData *SD,
 | |
|                      MachO::any_relocation_info &MRE) {
 | |
|     RelAndSymbol P(RelSymbol, MRE);
 | |
|     Relocations[SD].push_back(P);
 | |
|   }
 | |
| 
 | |
|   void RecordScatteredRelocation(const MCAssembler &Asm,
 | |
|                                  const MCAsmLayout &Layout,
 | |
|                                  const MCFragment *Fragment,
 | |
|                                  const MCFixup &Fixup, MCValue Target,
 | |
|                                  unsigned Log2Size,
 | |
|                                  uint64_t &FixedValue);
 | |
| 
 | |
|   void RecordTLVPRelocation(const MCAssembler &Asm,
 | |
|                             const MCAsmLayout &Layout,
 | |
|                             const MCFragment *Fragment,
 | |
|                             const MCFixup &Fixup, MCValue Target,
 | |
|                             uint64_t &FixedValue);
 | |
| 
 | |
|   void RecordRelocation(MCAssembler &Asm, const MCAsmLayout &Layout,
 | |
|                         const MCFragment *Fragment, const MCFixup &Fixup,
 | |
|                         MCValue Target, bool &IsPCRel,
 | |
|                         uint64_t &FixedValue) override;
 | |
| 
 | |
|   void BindIndirectSymbols(MCAssembler &Asm);
 | |
| 
 | |
|   /// ComputeSymbolTable - Compute the symbol table data
 | |
|   ///
 | |
|   void ComputeSymbolTable(MCAssembler &Asm,
 | |
|                           std::vector<MachSymbolData> &LocalSymbolData,
 | |
|                           std::vector<MachSymbolData> &ExternalSymbolData,
 | |
|                           std::vector<MachSymbolData> &UndefinedSymbolData);
 | |
| 
 | |
|   void computeSectionAddresses(const MCAssembler &Asm,
 | |
|                                const MCAsmLayout &Layout);
 | |
| 
 | |
|   void markAbsoluteVariableSymbols(MCAssembler &Asm,
 | |
|                                    const MCAsmLayout &Layout);
 | |
|   void ExecutePostLayoutBinding(MCAssembler &Asm,
 | |
|                                 const MCAsmLayout &Layout) override;
 | |
| 
 | |
|   bool IsSymbolRefDifferenceFullyResolvedImpl(const MCAssembler &Asm,
 | |
|                                               const MCSymbolData &DataA,
 | |
|                                               const MCFragment &FB,
 | |
|                                               bool InSet,
 | |
|                                               bool IsPCRel) const override;
 | |
| 
 | |
|   void WriteObject(MCAssembler &Asm, const MCAsmLayout &Layout) override;
 | |
| };
 | |
| 
 | |
| 
 | |
| /// \brief Construct a new Mach-O writer instance.
 | |
| ///
 | |
| /// This routine takes ownership of the target writer subclass \p MOTW.
 | |
| /// \param MOTW - The target specific Mach-O writer subclass.
 | |
| /// \param OS - The stream to write to.
 | |
| /// \param IsLittleEndian - Byte-order flag for the writer (presumably true selects little-endian output; confirm against MCObjectWriter).
 | |
| /// \returns The constructed object writer.
 | |
| MCObjectWriter *createMachObjectWriter(MCMachObjectTargetWriter *MOTW,
 | |
|                                        raw_ostream &OS, bool IsLittleEndian);
 | |
| 
 | |
| } // End llvm namespace
 | |
| 
 | |
| #endif
 |