MCAssembler.h revision f3014761c955345d6e05491608e73228d014afb7
1//===- MCAssembler.h - Object File Generation -------------------*- C++ -*-===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9 10#ifndef LLVM_MC_MCASSEMBLER_H 11#define LLVM_MC_MCASSEMBLER_H 12 13#include "llvm/ADT/ArrayRef.h" 14#include "llvm/ADT/STLExtras.h" 15#include "llvm/ADT/SmallPtrSet.h" 16#include "llvm/ADT/StringRef.h" 17#include "llvm/ADT/iterator.h" 18#include "llvm/ADT/iterator_range.h" 19#include "llvm/MC/MCDirectives.h" 20#include "llvm/MC/MCDwarf.h" 21#include "llvm/MC/MCFixup.h" 22#include "llvm/MC/MCFragment.h" 23#include "llvm/MC/MCLinkerOptimizationHint.h" 24#include "llvm/MC/MCSymbol.h" 25#include <cassert> 26#include <cstddef> 27#include <cstdint> 28#include <string> 29#include <utility> 30#include <vector> 31 32namespace llvm { 33 34class MCAsmBackend; 35class MCAsmLayout; 36class MCContext; 37class MCCodeEmitter; 38class MCFragment; 39class MCObjectWriter; 40class MCSection; 41class MCValue; 42 43// FIXME: This really doesn't belong here. See comments below. 44struct IndirectSymbolData { 45 MCSymbol *Symbol; 46 MCSection *Section; 47}; 48 49// FIXME: Ditto this. Purely so the Streamer and the ObjectWriter can talk 50// to one another. 51struct DataRegionData { 52 // This enum should be kept in sync w/ the mach-o definition in 53 // llvm/Object/MachOFormat.h. 54 enum KindTy { Data = 1, JumpTable8, JumpTable16, JumpTable32 } Kind; 55 MCSymbol *Start; 56 MCSymbol *End; 57}; 58 59class MCAssembler { 60 friend class MCAsmLayout; 61 62public: 63 using SectionListType = std::vector<MCSection *>; 64 using SymbolDataListType = std::vector<const MCSymbol *>; 65 66 using const_iterator = pointee_iterator<SectionListType::const_iterator>; 67 using iterator = pointee_iterator<SectionListType::iterator>; 68 69 using const_symbol_iterator = 70 pointee_iterator<SymbolDataListType::const_iterator>; 71 using symbol_iterator = pointee_iterator<SymbolDataListType::iterator>; 72 73 using symbol_range = iterator_range<symbol_iterator>; 74 using const_symbol_range = iterator_range<const_symbol_iterator>; 75 76 using const_indirect_symbol_iterator = 77 std::vector<IndirectSymbolData>::const_iterator; 78 using indirect_symbol_iterator = std::vector<IndirectSymbolData>::iterator; 79 80 using const_data_region_iterator = 81 std::vector<DataRegionData>::const_iterator; 82 using data_region_iterator = std::vector<DataRegionData>::iterator; 83 84 /// MachO specific deployment target version info. 85 // A Major version of 0 indicates that no version information was supplied 86 // and so the corresponding load command should not be emitted. 87 using VersionMinInfoType = struct { 88 MCVersionMinType Kind; 89 unsigned Major; 90 unsigned Minor; 91 unsigned Update; 92 }; 93 94private: 95 MCContext &Context; 96 97 MCAsmBackend &Backend; 98 99 MCCodeEmitter &Emitter; 100 101 MCObjectWriter &Writer; 102 103 SectionListType Sections; 104 105 SymbolDataListType Symbols; 106 107 std::vector<IndirectSymbolData> IndirectSymbols; 108 109 std::vector<DataRegionData> DataRegions; 110 111 /// The list of linker options to propagate into the object file. 112 std::vector<std::vector<std::string>> LinkerOptions; 113 114 /// List of declared file names 115 std::vector<std::string> FileNames; 116 117 MCDwarfLineTableParams LTParams; 118 119 /// The set of function symbols for which a .thumb_func directive has 120 /// been seen. 121 // 122 // FIXME: We really would like this in target specific code rather than 123 // here. Maybe when the relocation stuff moves to target specific, 124 // this can go with it? The streamer would need some target specific 125 // refactoring too. 126 mutable SmallPtrSet<const MCSymbol *, 32> ThumbFuncs; 127 128 /// \brief The bundle alignment size currently set in the assembler. 129 /// 130 /// By default it's 0, which means bundling is disabled. 131 unsigned BundleAlignSize; 132 133 bool RelaxAll : 1; 134 bool SubsectionsViaSymbols : 1; 135 bool IncrementalLinkerCompatible : 1; 136 137 /// ELF specific e_header flags 138 // It would be good if there were an MCELFAssembler class to hold this. 139 // ELF header flags are used both by the integrated and standalone assemblers. 140 // Access to the flags is necessary in cases where assembler directives affect 141 // which flags to be set. 142 unsigned ELFHeaderEFlags; 143 144 /// Used to communicate Linker Optimization Hint information between 145 /// the Streamer and the .o writer 146 MCLOHContainer LOHContainer; 147 148 VersionMinInfoType VersionMinInfo; 149 150 /// Evaluate a fixup to a relocatable expression and the value which should be 151 /// placed into the fixup. 152 /// 153 /// \param Layout The layout to use for evaluation. 154 /// \param Fixup The fixup to evaluate. 155 /// \param DF The fragment the fixup is inside. 156 /// \param Target [out] On return, the relocatable expression the fixup 157 /// evaluates to. 158 /// \param Value [out] On return, the value of the fixup as currently laid 159 /// out. 160 /// \return Whether the fixup value was fully resolved. This is true if the 161 /// \p Value result is fixed, otherwise the value may change due to 162 /// relocation. 163 bool evaluateFixup(const MCAsmLayout &Layout, const MCFixup &Fixup, 164 const MCFragment *DF, MCValue &Target, 165 uint64_t &Value) const; 166 167 /// Check whether a fixup can be satisfied, or whether it needs to be relaxed 168 /// (increased in size, in order to hold its value correctly). 169 bool fixupNeedsRelaxation(const MCFixup &Fixup, const MCRelaxableFragment *DF, 170 const MCAsmLayout &Layout) const; 171 172 /// Check whether the given fragment needs relaxation. 173 bool fragmentNeedsRelaxation(const MCRelaxableFragment *IF, 174 const MCAsmLayout &Layout) const; 175 176 /// \brief Perform one layout iteration and return true if any offsets 177 /// were adjusted. 178 bool layoutOnce(MCAsmLayout &Layout); 179 180 /// \brief Perform one layout iteration of the given section and return true 181 /// if any offsets were adjusted. 182 bool layoutSectionOnce(MCAsmLayout &Layout, MCSection &Sec); 183 184 bool relaxInstruction(MCAsmLayout &Layout, MCRelaxableFragment &IF); 185 186 bool relaxLEB(MCAsmLayout &Layout, MCLEBFragment &IF); 187 188 bool relaxDwarfLineAddr(MCAsmLayout &Layout, MCDwarfLineAddrFragment &DF); 189 bool relaxDwarfCallFrameFragment(MCAsmLayout &Layout, 190 MCDwarfCallFrameFragment &DF); 191 bool relaxCVInlineLineTable(MCAsmLayout &Layout, 192 MCCVInlineLineTableFragment &DF); 193 bool relaxCVDefRange(MCAsmLayout &Layout, MCCVDefRangeFragment &DF); 194 195 /// finishLayout - Finalize a layout, including fragment lowering. 196 void finishLayout(MCAsmLayout &Layout); 197 198 std::tuple<MCValue, uint64_t, bool> 199 handleFixup(const MCAsmLayout &Layout, MCFragment &F, const MCFixup &Fixup); 200 201public: 202 /// Construct a new assembler instance. 203 // 204 // FIXME: How are we going to parameterize this? Two obvious options are stay 205 // concrete and require clients to pass in a target like object. The other 206 // option is to make this abstract, and have targets provide concrete 207 // implementations as we do with AsmParser. 208 MCAssembler(MCContext &Context, MCAsmBackend &Backend, 209 MCCodeEmitter &Emitter, MCObjectWriter &Writer); 210 MCAssembler(const MCAssembler &) = delete; 211 MCAssembler &operator=(const MCAssembler &) = delete; 212 ~MCAssembler(); 213 214 /// Compute the effective fragment size assuming it is laid out at the given 215 /// \p SectionAddress and \p FragmentOffset. 216 uint64_t computeFragmentSize(const MCAsmLayout &Layout, 217 const MCFragment &F) const; 218 219 /// Find the symbol which defines the atom containing the given symbol, or 220 /// null if there is no such symbol. 221 const MCSymbol *getAtom(const MCSymbol &S) const; 222 223 /// Check whether a particular symbol is visible to the linker and is required 224 /// in the symbol table, or whether it can be discarded by the assembler. This 225 /// also effects whether the assembler treats the label as potentially 226 /// defining a separate atom. 227 bool isSymbolLinkerVisible(const MCSymbol &SD) const; 228 229 /// Emit the section contents using the given object writer. 230 void writeSectionData(const MCSection *Section, 231 const MCAsmLayout &Layout) const; 232 233 /// Check whether a given symbol has been flagged with .thumb_func. 234 bool isThumbFunc(const MCSymbol *Func) const; 235 236 /// Flag a function symbol as the target of a .thumb_func directive. 237 void setIsThumbFunc(const MCSymbol *Func) { ThumbFuncs.insert(Func); } 238 239 /// ELF e_header flags 240 unsigned getELFHeaderEFlags() const { return ELFHeaderEFlags; } 241 void setELFHeaderEFlags(unsigned Flags) { ELFHeaderEFlags = Flags; } 242 243 /// MachO deployment target version information. 244 const VersionMinInfoType &getVersionMinInfo() const { return VersionMinInfo; } 245 void setVersionMinInfo(MCVersionMinType Kind, unsigned Major, unsigned Minor, 246 unsigned Update) { 247 VersionMinInfo.Kind = Kind; 248 VersionMinInfo.Major = Major; 249 VersionMinInfo.Minor = Minor; 250 VersionMinInfo.Update = Update; 251 } 252 253 /// Reuse an assembler instance 254 /// 255 void reset(); 256 257 MCContext &getContext() const { return Context; } 258 259 MCAsmBackend &getBackend() const { return Backend; } 260 261 MCCodeEmitter &getEmitter() const { return Emitter; } 262 263 MCObjectWriter &getWriter() const { return Writer; } 264 265 MCDwarfLineTableParams getDWARFLinetableParams() const { return LTParams; } 266 void setDWARFLinetableParams(MCDwarfLineTableParams P) { LTParams = P; } 267 268 /// Finish - Do final processing and write the object to the output stream. 269 /// \p Writer is used for custom object writer (as the MCJIT does), 270 /// if not specified it is automatically created from backend. 271 void Finish(); 272 273 // Layout all section and prepare them for emission. 274 void layout(MCAsmLayout &Layout); 275 276 // FIXME: This does not belong here. 277 bool getSubsectionsViaSymbols() const { return SubsectionsViaSymbols; } 278 void setSubsectionsViaSymbols(bool Value) { SubsectionsViaSymbols = Value; } 279 280 bool isIncrementalLinkerCompatible() const { 281 return IncrementalLinkerCompatible; 282 } 283 void setIncrementalLinkerCompatible(bool Value) { 284 IncrementalLinkerCompatible = Value; 285 } 286 287 bool getRelaxAll() const { return RelaxAll; } 288 void setRelaxAll(bool Value) { RelaxAll = Value; } 289 290 bool isBundlingEnabled() const { return BundleAlignSize != 0; } 291 292 unsigned getBundleAlignSize() const { return BundleAlignSize; } 293 294 void setBundleAlignSize(unsigned Size) { 295 assert((Size == 0 || !(Size & (Size - 1))) && 296 "Expect a power-of-two bundle align size"); 297 BundleAlignSize = Size; 298 } 299 300 /// \name Section List Access 301 /// @{ 302 303 iterator begin() { return Sections.begin(); } 304 const_iterator begin() const { return Sections.begin(); } 305 306 iterator end() { return Sections.end(); } 307 const_iterator end() const { return Sections.end(); } 308 309 size_t size() const { return Sections.size(); } 310 311 /// @} 312 /// \name Symbol List Access 313 /// @{ 314 symbol_iterator symbol_begin() { return Symbols.begin(); } 315 const_symbol_iterator symbol_begin() const { return Symbols.begin(); } 316 317 symbol_iterator symbol_end() { return Symbols.end(); } 318 const_symbol_iterator symbol_end() const { return Symbols.end(); } 319 320 symbol_range symbols() { return make_range(symbol_begin(), symbol_end()); } 321 const_symbol_range symbols() const { 322 return make_range(symbol_begin(), symbol_end()); 323 } 324 325 size_t symbol_size() const { return Symbols.size(); } 326 327 /// @} 328 /// \name Indirect Symbol List Access 329 /// @{ 330 331 // FIXME: This is a total hack, this should not be here. Once things are 332 // factored so that the streamer has direct access to the .o writer, it can 333 // disappear. 334 std::vector<IndirectSymbolData> &getIndirectSymbols() { 335 return IndirectSymbols; 336 } 337 338 indirect_symbol_iterator indirect_symbol_begin() { 339 return IndirectSymbols.begin(); 340 } 341 const_indirect_symbol_iterator indirect_symbol_begin() const { 342 return IndirectSymbols.begin(); 343 } 344 345 indirect_symbol_iterator indirect_symbol_end() { 346 return IndirectSymbols.end(); 347 } 348 const_indirect_symbol_iterator indirect_symbol_end() const { 349 return IndirectSymbols.end(); 350 } 351 352 size_t indirect_symbol_size() const { return IndirectSymbols.size(); } 353 354 /// @} 355 /// \name Linker Option List Access 356 /// @{ 357 358 std::vector<std::vector<std::string>> &getLinkerOptions() { 359 return LinkerOptions; 360 } 361 362 /// @} 363 /// \name Data Region List Access 364 /// @{ 365 366 // FIXME: This is a total hack, this should not be here. Once things are 367 // factored so that the streamer has direct access to the .o writer, it can 368 // disappear. 369 std::vector<DataRegionData> &getDataRegions() { return DataRegions; } 370 371 data_region_iterator data_region_begin() { return DataRegions.begin(); } 372 const_data_region_iterator data_region_begin() const { 373 return DataRegions.begin(); 374 } 375 376 data_region_iterator data_region_end() { return DataRegions.end(); } 377 const_data_region_iterator data_region_end() const { 378 return DataRegions.end(); 379 } 380 381 size_t data_region_size() const { return DataRegions.size(); } 382 383 /// @} 384 /// \name Data Region List Access 385 /// @{ 386 387 // FIXME: This is a total hack, this should not be here. Once things are 388 // factored so that the streamer has direct access to the .o writer, it can 389 // disappear. 390 MCLOHContainer &getLOHContainer() { return LOHContainer; } 391 const MCLOHContainer &getLOHContainer() const { 392 return const_cast<MCAssembler *>(this)->getLOHContainer(); 393 } 394 /// @} 395 /// \name Backend Data Access 396 /// @{ 397 398 bool registerSection(MCSection &Section); 399 400 void registerSymbol(const MCSymbol &Symbol, bool *Created = nullptr); 401 402 ArrayRef<std::string> getFileNames() { return FileNames; } 403 404 void addFileName(StringRef FileName) { 405 if (!is_contained(FileNames, FileName)) 406 FileNames.push_back(FileName); 407 } 408 409 /// \brief Write the necessary bundle padding to the given object writer. 410 /// Expects a fragment \p F containing instructions and its size \p FSize. 411 void writeFragmentPadding(const MCFragment &F, uint64_t FSize, 412 MCObjectWriter *OW) const; 413 414 /// @} 415 416 void dump() const; 417}; 418 419/// \brief Compute the amount of padding required before the fragment \p F to 420/// obey bundling restrictions, where \p FOffset is the fragment's offset in 421/// its section and \p FSize is the fragment's size. 422uint64_t computeBundlePadding(const MCAssembler &Assembler, const MCFragment *F, 423 uint64_t FOffset, uint64_t FSize); 424 425} // end namespace llvm 426 427#endif // LLVM_MC_MCASSEMBLER_H 428