1 //===-- llvm/MC/MCMachObjectWriter.h - Mach Object Writer -------*- C++ -*-===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 #ifndef LLVM_MC_MCMACHOBJECTWRITER_H
11 #define LLVM_MC_MCMACHOBJECTWRITER_H
13 #include "llvm/ADT/DenseMap.h"
14 #include "llvm/ADT/SmallString.h"
15 #include "llvm/MC/MCExpr.h"
16 #include "llvm/MC/MCObjectWriter.h"
17 #include "llvm/MC/StringTableBuilder.h"
18 #include "llvm/Support/DataTypes.h"
19 #include "llvm/Support/MachO.h"
25 class MachObjectWriter;
/// Target-specific description used by the Mach-O object writer. It stores the
/// 64-bit flag, CPU type/subtype and symbol-folding preference that the
/// accessors below return, and declares the pure virtual RecordRelocation()
/// hook.
/// NOTE(review): no access specifiers or closing braces are visible in this
/// listing; confirm the class layout against the complete header.
27 class MCMachObjectTargetWriter {
/// Returned by is64Bit().
28 const unsigned Is64Bit : 1;
/// Returned by getCPUType().
29 const uint32_t CPUType;
/// Returned by getCPUSubtype().
30 const uint32_t CPUSubtype;
/// Returned by useAggressiveSymbolFolding().
31 // FIXME: Remove this, we should just always use it once we no longer care
32 // about Darwin 'as' compatibility.
33 const unsigned UseAggressiveSymbolFolding : 1;
/// Relocation type handed out by getLocalDifferenceRelocationType(). Unlike the
/// fields above it is not const; setLocalDifferenceRelocationType() assigns it.
34 unsigned LocalDifference_RIT;
/// Constructor. \p UseAggressiveSymbolFolding_ defaults to false.
/// NOTE(review): no CPU subtype parameter is visible here even though a const
/// CPUSubtype member exists -- the parameter list looks incomplete; confirm.
37 MCMachObjectTargetWriter(bool Is64Bit_, uint32_t CPUType_,
39 bool UseAggressiveSymbolFolding_ = false);
/// Stores \p Type as the local-difference relocation type.
41 void setLocalDifferenceRelocationType(unsigned Type) {
42 LocalDifference_RIT = Type;
/// Virtual destructor; only declared here, without an inline body.
46 virtual ~MCMachObjectTargetWriter();
48 /// @name Lifetime Management
/// Virtual reset hook; this default implementation is empty.
51 virtual void reset() {};
/// Read-only accessors for the configuration stored in the members above.
58 bool is64Bit() const { return Is64Bit; }
59 bool useAggressiveSymbolFolding() const { return UseAggressiveSymbolFolding; }
60 uint32_t getCPUType() const { return CPUType; }
61 uint32_t getCPUSubtype() const { return CPUSubtype; }
62 unsigned getLocalDifferenceRelocationType() const {
63 return LocalDifference_RIT;
/// Pure virtual hook: a concrete target writer must provide it.
/// \p FixedValue is taken by non-const reference, so an implementation is able
/// to modify it; \p Writer is the MachObjectWriter the call is made for.
/// NOTE(review): presumably records the relocation needed for \p Fixup --
/// confirm against a target implementation.
71 virtual void RecordRelocation(MachObjectWriter *Writer, MCAssembler &Asm,
72 const MCAsmLayout &Layout,
73 const MCFragment *Fragment,
74 const MCFixup &Fixup, MCValue Target,
75 uint64_t &FixedValue) = 0;
/// Mach-O object writer, derived from MCObjectWriter.
80 class MachObjectWriter : public MCObjectWriter {
81 /// MachSymbolData - Helper struct for containing some precomputed information
/// about a symbol; it holds a pointer to the symbol's MCSymbolData.
/// NOTE(review): only one member is visible in this listing; the struct may
/// have further fields -- confirm against the complete header.
83 struct MachSymbolData {
/// The symbol data this entry refers to.
84 MCSymbolData *SymbolData;
88 // Support lexicographic sorting.
89 bool operator<(const MachSymbolData &RHS) const;
92 /// The target specific Mach-O writer instance.
/// Held through std::unique_ptr, so this writer owns the target writer.
93 std::unique_ptr<MCMachObjectTargetWriter> TargetObjectWriter;
95 /// @name Relocation Data
/// Members of the relocation record stored in the Relocations map below: a
/// relocation entry together with the symbol data pointer it was added with.
/// NOTE(review): the enclosing struct header (RelAndSymbol, judging by the
/// constructor name) is not visible in this listing.
99 const MCSymbolData *Sym;
100 MachO::any_relocation_info MRE;
/// Initializes both members from the arguments; \p MRE is copied.
101 RelAndSymbol(const MCSymbolData *Sym, const MachO::any_relocation_info &MRE)
102 : Sym(Sym), MRE(MRE) {}
/// Relocation records grouped by section; addRelocation() appends to it.
105 llvm::DenseMap<const MCSectionData *, std::vector<RelAndSymbol>> Relocations;
/// One unsigned value per section.
/// NOTE(review): presumably the section's first index into the indirect
/// symbol table -- confirm in the implementation.
106 llvm::DenseMap<const MCSectionData*, unsigned> IndirectSymBase;
109 /// @name Symbol Table Data
/// Builder object for the string table.
112 StringTableBuilder StringTable;
/// Three separate lists of MachSymbolData entries, one each for local,
/// external and undefined symbols.
113 std::vector<MachSymbolData> LocalSymbolData;
114 std::vector<MachSymbolData> ExternalSymbolData;
115 std::vector<MachSymbolData> UndefinedSymbolData;
/// Returns a pointer to the MachSymbolData entry for \p Sym.
/// NOTE(review): the pointer return type suggests nullptr when no entry
/// exists, and the lists searched are not visible here -- confirm in the
/// implementation.
119 MachSymbolData *findSymbolData(const MCSymbol &Sym);
/// Constructs the writer: forwards \p OS and IsLittleEndian to the
/// MCObjectWriter base and takes ownership of \p MOTW by storing it in the
/// TargetObjectWriter unique_ptr.
/// NOTE(review): IsLittleEndian is used in the initializer list but its
/// parameter declaration is not visible in this listing.
122 MachObjectWriter(MCMachObjectTargetWriter *MOTW, raw_ostream &OS,
124 : MCObjectWriter(OS, IsLittleEndian), TargetObjectWriter(MOTW) {}
126 /// @name Lifetime management Methods
/// Overrides the base-class reset(); only declared here.
129 void reset() override;
133 /// @name Utility Methods
/// Declared only. NOTE(review): by its name, reports whether fixup kind
/// \p Kind is PC-relative -- confirm in the implementation.
136 bool isFixupKindPCRel(const MCAssembler &Asm, unsigned Kind);
/// Section address table queried by getSectionAddress().
/// NOTE(review): the SectionAddrMap type is not declared in the visible lines.
138 SectionAddrMap SectionAddress;
/// Gives callers mutable access to the section address table.
140 SectionAddrMap &getSectionAddressMap() { return SectionAddress; }
/// Returns the result of SectionAddress.lookup(SD).
142 uint64_t getSectionAddress(const MCSectionData* SD) const {
143 return SectionAddress.lookup(SD);
/// Address and size helpers; const member functions that are declared here
/// and implemented elsewhere.
145 uint64_t getSymbolAddress(const MCSymbolData* SD,
146 const MCAsmLayout &Layout) const;
148 uint64_t getFragmentAddress(const MCFragment *Fragment,
149 const MCAsmLayout &Layout) const;
151 uint64_t getPaddingSize(const MCSectionData *SD,
152 const MCAsmLayout &Layout) const;
/// Declared only. NOTE(review): by its name, tells whether \p SD needs an
/// external relocation -- confirm in the implementation.
154 bool doesSymbolRequireExternRelocation(const MCSymbolData *SD);
158 /// @name Target Writer Proxy Accessors
/// Forwards to the target writer's is64Bit().
161 bool is64Bit() const { return TargetObjectWriter->is64Bit(); }
/// True when the target writer's CPU type equals MachO::CPU_TYPE_X86_64.
162 bool isX86_64() const {
163 uint32_t CPUType = TargetObjectWriter->getCPUType();
164 return CPUType == MachO::CPU_TYPE_X86_64;
/// Output routines for the individual parts of the object file. All of them
/// are declarations only; the descriptions below follow the routine and
/// parameter names and should be confirmed against the implementation.
/// NOTE(review): some parameter lines appear to be missing from this listing.

/// Writes the file header; takes the load-command count and size.
169 void WriteHeader(unsigned NumLoadCommands, unsigned LoadCommandsSize,
170 bool SubsectionsViaSymbols);
172 /// WriteSegmentLoadCommand - Write a segment load command.
174 /// \param NumSections The number of sections in this segment.
175 /// \param SectionDataSize The total size of the sections.
176 void WriteSegmentLoadCommand(unsigned NumSections,
178 uint64_t SectionDataStartOffset,
179 uint64_t SectionDataSize);
/// Writes the entry for section \p SD, given its file offset and the start
/// and count of its relocations.
181 void WriteSection(const MCAssembler &Asm, const MCAsmLayout &Layout,
182 const MCSectionData &SD, uint64_t FileOffset,
183 uint64_t RelocationsStart, unsigned NumRelocations);
/// Writes the symtab load command from the symbol and string table
/// offsets/sizes.
185 void WriteSymtabLoadCommand(uint32_t SymbolOffset, uint32_t NumSymbols,
186 uint32_t StringTableOffset,
187 uint32_t StringTableSize);
/// Writes the dysymtab load command; each symbol class (local, external,
/// undefined) and the indirect symbols are given as a first index/offset plus
/// a count.
189 void WriteDysymtabLoadCommand(uint32_t FirstLocalSymbol,
190 uint32_t NumLocalSymbols,
191 uint32_t FirstExternalSymbol,
192 uint32_t NumExternalSymbols,
193 uint32_t FirstUndefinedSymbol,
194 uint32_t NumUndefinedSymbols,
195 uint32_t IndirectSymbolOffset,
196 uint32_t NumIndirectSymbols);
/// Writes one symbol table (nlist) entry for \p MSD.
198 void WriteNlist(MachSymbolData &MSD, const MCAsmLayout &Layout);
/// Writes a linkedit load command of kind \p Type.
/// NOTE(review): the remainder of this parameter list is not visible here.
200 void WriteLinkeditLoadCommand(uint32_t Type, uint32_t DataOffset,
/// Writes a linker-options load command carrying the strings in \p Options.
203 void WriteLinkerOptionsLoadCommand(const std::vector<std::string> &Options);
205 // FIXME: We really need to improve the relocation validation. Basically, we
206 // want to implement a separate computation which evaluates the relocation
207 // entry as the linker would, and verifies that the resultant fixup value is
208 // exactly what the encoder wanted. This will catch several classes of
// problems:
211 // - Relocation entry bugs, the two algorithms are unlikely to have the same
// exact bug.
214 // - Relaxation issues, where we forget to relax something.
216 // - Input errors, where something cannot be correctly encoded. 'as' allows
217 // these through in many cases.
219 // Add a relocation to be output in the object file. At the time this is
220 // called, the symbol indexes are not known, so if the relocation refers
221 // to a symbol it should be passed as \p RelSymbol so that it can be updated
222 // afterwards. If the relocation doesn't refer to a symbol, nullptr should be
// passed.
//
// The entry is copied: a RelAndSymbol is built from (RelSymbol, MRE) and
// appended to the list kept for section \p SD in Relocations.
224 void addRelocation(const MCSymbolData *RelSymbol, const MCSectionData *SD,
225 MachO::any_relocation_info &MRE) {
226 RelAndSymbol P(RelSymbol, MRE);
227 Relocations[SD].push_back(P);
/// Relocation recording entry points. All three are declarations only and all
/// take \p FixedValue by non-const reference, so an implementation is able to
/// modify it.

/// NOTE(review): by its name, records a scattered relocation for \p Fixup;
/// part of the parameter list appears to be missing from this listing.
230 void RecordScatteredRelocation(const MCAssembler &Asm,
231 const MCAsmLayout &Layout,
232 const MCFragment *Fragment,
233 const MCFixup &Fixup, MCValue Target,
235 uint64_t &FixedValue);
/// NOTE(review): by its name, records a TLVP (thread-local variable)
/// relocation for \p Fixup -- confirm in the implementation.
237 void RecordTLVPRelocation(const MCAssembler &Asm,
238 const MCAsmLayout &Layout,
239 const MCFragment *Fragment,
240 const MCFixup &Fixup, MCValue Target,
241 uint64_t &FixedValue);
/// Overrides the base-class RecordRelocation(). \p IsPCRel is also taken by
/// non-const reference.
243 void RecordRelocation(MCAssembler &Asm, const MCAsmLayout &Layout,
244 const MCFragment *Fragment, const MCFixup &Fixup,
245 MCValue Target, bool &IsPCRel,
246 uint64_t &FixedValue) override;
/// Declared only. NOTE(review): by its name, binds the assembler's indirect
/// symbols -- confirm in the implementation.
248 void BindIndirectSymbols(MCAssembler &Asm);
250 /// ComputeSymbolTable - Compute the symbol table data
/// The three vectors are taken by non-const reference, so the routine is able
/// to fill them.
252 void ComputeSymbolTable(MCAssembler &Asm,
253 std::vector<MachSymbolData> &LocalSymbolData,
254 std::vector<MachSymbolData> &ExternalSymbolData,
255 std::vector<MachSymbolData> &UndefinedSymbolData);
/// Declared only. NOTE(review): presumably fills the SectionAddress table
/// from \p Layout -- confirm in the implementation.
257 void computeSectionAddresses(const MCAssembler &Asm,
258 const MCAsmLayout &Layout);
/// Overrides the base-class post-layout binding hook.
260 void ExecutePostLayoutBinding(MCAssembler &Asm,
261 const MCAsmLayout &Layout) override;
/// Overrides the base-class query; const member function.
/// NOTE(review): part of the parameter list appears to be missing from this
/// listing.
263 bool IsSymbolRefDifferenceFullyResolvedImpl(const MCAssembler &Asm,
264 const MCSymbolData &DataA,
265 const MCFragment &FB,
267 bool IsPCRel) const override;
/// Overrides the base-class entry point that writes the object file for
/// \p Asm using \p Layout.
269 void WriteObject(MCAssembler &Asm, const MCAsmLayout &Layout) override;
273 /// \brief Construct a new Mach-O writer instance.
275 /// This routine takes ownership of the target writer subclass.
277 /// \param MOTW - The target specific Mach-O writer subclass.
278 /// \param OS - The stream to write to.
/// \param IsLittleEndian - NOTE(review): presumably selects the byte order of
/// the written object; confirm in the implementation.
279 /// \returns The constructed object writer.
280 MCObjectWriter *createMachObjectWriter(MCMachObjectTargetWriter *MOTW,
281 raw_ostream &OS, bool IsLittleEndian);
283 } // End llvm namespace