MCAsmStreamer.cpp revision 12e555c36ce11c39ce15cd0b27bf7b02a068beb2
1//===- lib/MC/MCAsmStreamer.cpp - Text Assembly Output --------------------===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9 10#include "llvm/MC/MCStreamer.h" 11#include "llvm/MC/MCAsmInfo.h" 12#include "llvm/MC/MCCodeEmitter.h" 13#include "llvm/MC/MCContext.h" 14#include "llvm/MC/MCExpr.h" 15#include "llvm/MC/MCInst.h" 16#include "llvm/MC/MCInstPrinter.h" 17#include "llvm/MC/MCSectionMachO.h" 18#include "llvm/MC/MCSymbol.h" 19#include "llvm/ADT/SmallString.h" 20#include "llvm/ADT/Twine.h" 21#include "llvm/Support/ErrorHandling.h" 22#include "llvm/Support/MathExtras.h" 23#include "llvm/Support/Format.h" 24#include "llvm/Support/FormattedStream.h" 25using namespace llvm; 26 27namespace { 28 29class MCAsmStreamer : public MCStreamer { 30 formatted_raw_ostream &OS; 31 const MCAsmInfo &MAI; 32 bool IsLittleEndian, IsVerboseAsm; 33 MCInstPrinter *InstPrinter; 34 MCCodeEmitter *Emitter; 35 36 SmallString<128> CommentToEmit; 37 raw_svector_ostream CommentStream; 38public: 39 MCAsmStreamer(MCContext &Context, formatted_raw_ostream &os, 40 const MCAsmInfo &mai, 41 bool isLittleEndian, bool isVerboseAsm, MCInstPrinter *printer, 42 MCCodeEmitter *emitter) 43 : MCStreamer(Context), OS(os), MAI(mai), IsLittleEndian(isLittleEndian), 44 IsVerboseAsm(isVerboseAsm), InstPrinter(printer), Emitter(emitter), 45 CommentStream(CommentToEmit) {} 46 ~MCAsmStreamer() {} 47 48 bool isLittleEndian() const { return IsLittleEndian; } 49 50 51 inline void EmitEOL() { 52 // If we don't have any comments, just emit a \n. 53 if (!IsVerboseAsm) { 54 OS << '\n'; 55 return; 56 } 57 EmitCommentsAndEOL(); 58 } 59 void EmitCommentsAndEOL(); 60 61 /// AddComment - Add a comment that can be emitted to the generated .s 62 /// file if applicable as a QoI issue to make the output of the compiler 63 /// more readable. This only affects the MCAsmStreamer, and only when 64 /// verbose assembly output is enabled. 65 virtual void AddComment(const Twine &T); 66 67 /// GetCommentOS - Return a raw_ostream that comments can be written to. 68 /// Unlike AddComment, you are required to terminate comments with \n if you 69 /// use this method. 70 virtual raw_ostream &GetCommentOS() { 71 if (!IsVerboseAsm) 72 return nulls(); // Discard comments unless in verbose asm mode. 73 return CommentStream; 74 } 75 76 /// AddBlankLine - Emit a blank line to a .s file to pretty it up. 77 virtual void AddBlankLine() { 78 EmitEOL(); 79 } 80 81 /// @name MCStreamer Interface 82 /// @{ 83 84 virtual void SwitchSection(const MCSection *Section); 85 86 virtual void EmitLabel(MCSymbol *Symbol); 87 88 virtual void EmitAssemblerFlag(AssemblerFlag Flag); 89 90 virtual void EmitAssignment(MCSymbol *Symbol, const MCExpr *Value); 91 92 virtual void EmitSymbolAttribute(MCSymbol *Symbol, SymbolAttr Attribute); 93 94 virtual void EmitSymbolDesc(MCSymbol *Symbol, unsigned DescValue); 95 96 virtual void EmitCommonSymbol(MCSymbol *Symbol, unsigned Size, 97 unsigned ByteAlignment); 98 99 virtual void EmitZerofill(const MCSection *Section, MCSymbol *Symbol = 0, 100 unsigned Size = 0, unsigned ByteAlignment = 0); 101 102 virtual void EmitBytes(StringRef Data, unsigned AddrSpace); 103 104 virtual void EmitValue(const MCExpr *Value, unsigned Size,unsigned AddrSpace); 105 virtual void EmitIntValue(uint64_t Value, unsigned Size, unsigned AddrSpace); 106 107 virtual void EmitFill(uint64_t NumBytes, uint8_t FillValue, 108 unsigned AddrSpace); 109 110 virtual void EmitValueToAlignment(unsigned ByteAlignment, int64_t Value = 0, 111 unsigned ValueSize = 1, 112 unsigned MaxBytesToEmit = 0); 113 114 virtual void EmitValueToOffset(const MCExpr *Offset, 115 unsigned char Value = 0); 116 117 virtual void EmitInstruction(const MCInst &Inst); 118 119 virtual void Finish(); 120 121 /// @} 122}; 123 124} // end anonymous namespace. 125 126/// AddComment - Add a comment that can be emitted to the generated .s 127/// file if applicable as a QoI issue to make the output of the compiler 128/// more readable. This only affects the MCAsmStreamer, and only when 129/// verbose assembly output is enabled. 130void MCAsmStreamer::AddComment(const Twine &T) { 131 if (!IsVerboseAsm) return; 132 133 // Make sure that CommentStream is flushed. 134 CommentStream.flush(); 135 136 T.toVector(CommentToEmit); 137 // Each comment goes on its own line. 138 CommentToEmit.push_back('\n'); 139 140 // Tell the comment stream that the vector changed underneath it. 141 CommentStream.resync(); 142} 143 144void MCAsmStreamer::EmitCommentsAndEOL() { 145 if (CommentToEmit.empty() && CommentStream.GetNumBytesInBuffer() == 0) { 146 OS << '\n'; 147 return; 148 } 149 150 CommentStream.flush(); 151 StringRef Comments = CommentToEmit.str(); 152 153 assert(Comments.back() == '\n' && 154 "Comment array not newline terminated"); 155 do { 156 // Emit a line of comments. 157 OS.PadToColumn(MAI.getCommentColumn()); 158 size_t Position = Comments.find('\n'); 159 OS << MAI.getCommentString() << ' ' << Comments.substr(0, Position) << '\n'; 160 161 Comments = Comments.substr(Position+1); 162 } while (!Comments.empty()); 163 164 CommentToEmit.clear(); 165 // Tell the comment stream that the vector changed underneath it. 166 CommentStream.resync(); 167} 168 169 170static inline int64_t truncateToSize(int64_t Value, unsigned Bytes) { 171 assert(Bytes && "Invalid size!"); 172 return Value & ((uint64_t) (int64_t) -1 >> (64 - Bytes * 8)); 173} 174 175static inline const MCExpr *truncateToSize(const MCExpr *Value, 176 unsigned Bytes) { 177 // FIXME: Do we really need this routine? 178 return Value; 179} 180 181void MCAsmStreamer::SwitchSection(const MCSection *Section) { 182 assert(Section && "Cannot switch to a null section!"); 183 if (Section != CurSection) { 184 CurSection = Section; 185 Section->PrintSwitchToSection(MAI, OS); 186 } 187} 188 189void MCAsmStreamer::EmitLabel(MCSymbol *Symbol) { 190 assert(Symbol->isUndefined() && "Cannot define a symbol twice!"); 191 assert(CurSection && "Cannot emit before setting section!"); 192 193 OS << *Symbol << ":"; 194 EmitEOL(); 195 Symbol->setSection(*CurSection); 196} 197 198void MCAsmStreamer::EmitAssemblerFlag(AssemblerFlag Flag) { 199 switch (Flag) { 200 default: assert(0 && "Invalid flag!"); 201 case SubsectionsViaSymbols: OS << ".subsections_via_symbols"; break; 202 } 203 EmitEOL(); 204} 205 206void MCAsmStreamer::EmitAssignment(MCSymbol *Symbol, const MCExpr *Value) { 207 // Only absolute symbols can be redefined. 208 assert((Symbol->isUndefined() || Symbol->isAbsolute()) && 209 "Cannot define a symbol twice!"); 210 211 OS << *Symbol << " = " << *Value; 212 EmitEOL(); 213 214 // FIXME: Lift context changes into super class. 215 // FIXME: Set associated section. 216 Symbol->setValue(Value); 217} 218 219void MCAsmStreamer::EmitSymbolAttribute(MCSymbol *Symbol, 220 SymbolAttr Attribute) { 221 switch (Attribute) { 222 case Global: OS << MAI.getGlobalDirective(); break; // .globl 223 case Hidden: OS << ".hidden "; break; 224 case IndirectSymbol: OS << ".indirect_symbol "; break; 225 case Internal: OS << ".internal "; break; 226 case LazyReference: OS << ".lazy_reference "; break; 227 case NoDeadStrip: OS << ".no_dead_strip "; break; 228 case PrivateExtern: OS << ".private_extern "; break; 229 case Protected: OS << ".protected "; break; 230 case Reference: OS << ".reference "; break; 231 case Weak: OS << ".weak "; break; 232 case WeakDefinition: OS << ".weak_definition "; break; 233 case WeakReference: OS << ".weak_reference "; break; 234 } 235 236 OS << *Symbol; 237 EmitEOL(); 238} 239 240void MCAsmStreamer::EmitSymbolDesc(MCSymbol *Symbol, unsigned DescValue) { 241 OS << ".desc" << ' ' << *Symbol << ',' << DescValue; 242 EmitEOL(); 243} 244 245void MCAsmStreamer::EmitCommonSymbol(MCSymbol *Symbol, unsigned Size, 246 unsigned ByteAlignment) { 247 OS << MAI.getCOMMDirective() << *Symbol << ',' << Size; 248 if (ByteAlignment != 0 && MAI.getCOMMDirectiveTakesAlignment()) { 249 if (MAI.getAlignmentIsInBytes()) 250 OS << ',' << ByteAlignment; 251 else 252 OS << ',' << Log2_32(ByteAlignment); 253 } 254 EmitEOL(); 255} 256 257void MCAsmStreamer::EmitZerofill(const MCSection *Section, MCSymbol *Symbol, 258 unsigned Size, unsigned ByteAlignment) { 259 // Note: a .zerofill directive does not switch sections. 260 OS << ".zerofill "; 261 262 // This is a mach-o specific directive. 263 const MCSectionMachO *MOSection = ((const MCSectionMachO*)Section); 264 OS << MOSection->getSegmentName() << "," << MOSection->getSectionName(); 265 266 if (Symbol != NULL) { 267 OS << ',' << *Symbol << ',' << Size; 268 if (ByteAlignment != 0) 269 OS << ',' << Log2_32(ByteAlignment); 270 } 271 EmitEOL(); 272} 273 274static inline char toOctal(int X) { return (X&7)+'0'; } 275 276void MCAsmStreamer::EmitBytes(StringRef Data, unsigned AddrSpace) { 277 assert(CurSection && "Cannot emit contents before setting section!"); 278 if (Data.empty()) return; 279 280 if (Data.size() == 1) { 281 OS << MAI.getData8bitsDirective(AddrSpace); 282 OS << (unsigned)(unsigned char)Data[0]; 283 EmitEOL(); 284 return; 285 } 286 287 // If the data ends with 0 and the target supports .asciz, use it, otherwise 288 // use .ascii 289 if (MAI.getAscizDirective() && Data.back() == 0) { 290 OS << MAI.getAscizDirective(); 291 Data = Data.substr(0, Data.size()-1); 292 } else { 293 OS << MAI.getAsciiDirective(); 294 } 295 296 OS << " \""; 297 for (unsigned i = 0, e = Data.size(); i != e; ++i) { 298 unsigned char C = Data[i]; 299 if (C == '"' || C == '\\') { 300 OS << '\\' << (char)C; 301 continue; 302 } 303 304 if (isprint((unsigned char)C)) { 305 OS << (char)C; 306 continue; 307 } 308 309 switch (C) { 310 case '\b': OS << "\\b"; break; 311 case '\f': OS << "\\f"; break; 312 case '\n': OS << "\\n"; break; 313 case '\r': OS << "\\r"; break; 314 case '\t': OS << "\\t"; break; 315 default: 316 OS << '\\'; 317 OS << toOctal(C >> 6); 318 OS << toOctal(C >> 3); 319 OS << toOctal(C >> 0); 320 break; 321 } 322 } 323 OS << '"'; 324 EmitEOL(); 325} 326 327/// EmitIntValue - Special case of EmitValue that avoids the client having 328/// to pass in a MCExpr for constant integers. 329void MCAsmStreamer::EmitIntValue(uint64_t Value, unsigned Size, 330 unsigned AddrSpace) { 331 assert(CurSection && "Cannot emit contents before setting section!"); 332 const char *Directive = 0; 333 switch (Size) { 334 default: break; 335 case 1: Directive = MAI.getData8bitsDirective(AddrSpace); break; 336 case 2: Directive = MAI.getData16bitsDirective(AddrSpace); break; 337 case 4: Directive = MAI.getData32bitsDirective(AddrSpace); break; 338 case 8: 339 Directive = MAI.getData64bitsDirective(AddrSpace); 340 // If the target doesn't support 64-bit data, emit as two 32-bit halves. 341 if (Directive) break; 342 if (isLittleEndian()) { 343 EmitIntValue((uint32_t)(Value >> 0 ), 4, AddrSpace); 344 EmitIntValue((uint32_t)(Value >> 32), 4, AddrSpace); 345 } else { 346 EmitIntValue((uint32_t)(Value >> 32), 4, AddrSpace); 347 EmitIntValue((uint32_t)(Value >> 0 ), 4, AddrSpace); 348 } 349 return; 350 } 351 352 assert(Directive && "Invalid size for machine code value!"); 353 OS << Directive << truncateToSize(Value, Size); 354 EmitEOL(); 355} 356 357void MCAsmStreamer::EmitValue(const MCExpr *Value, unsigned Size, 358 unsigned AddrSpace) { 359 assert(CurSection && "Cannot emit contents before setting section!"); 360 const char *Directive = 0; 361 switch (Size) { 362 default: break; 363 case 1: Directive = MAI.getData8bitsDirective(AddrSpace); break; 364 case 2: Directive = MAI.getData16bitsDirective(AddrSpace); break; 365 case 4: Directive = MAI.getData32bitsDirective(AddrSpace); break; 366 case 8: Directive = MAI.getData64bitsDirective(AddrSpace); break; 367 } 368 369 assert(Directive && "Invalid size for machine code value!"); 370 OS << Directive << *truncateToSize(Value, Size); 371 EmitEOL(); 372} 373 374/// EmitFill - Emit NumBytes bytes worth of the value specified by 375/// FillValue. This implements directives such as '.space'. 376void MCAsmStreamer::EmitFill(uint64_t NumBytes, uint8_t FillValue, 377 unsigned AddrSpace) { 378 if (NumBytes == 0) return; 379 380 if (AddrSpace == 0) 381 if (const char *ZeroDirective = MAI.getZeroDirective()) { 382 OS << ZeroDirective << NumBytes; 383 if (FillValue != 0) 384 OS << ',' << (int)FillValue; 385 EmitEOL(); 386 return; 387 } 388 389 // Emit a byte at a time. 390 MCStreamer::EmitFill(NumBytes, FillValue, AddrSpace); 391} 392 393void MCAsmStreamer::EmitValueToAlignment(unsigned ByteAlignment, int64_t Value, 394 unsigned ValueSize, 395 unsigned MaxBytesToEmit) { 396 // Some assemblers don't support non-power of two alignments, so we always 397 // emit alignments as a power of two if possible. 398 if (isPowerOf2_32(ByteAlignment)) { 399 switch (ValueSize) { 400 default: llvm_unreachable("Invalid size for machine code value!"); 401 case 1: OS << MAI.getAlignDirective(); break; 402 // FIXME: use MAI for this! 403 case 2: OS << ".p2alignw "; break; 404 case 4: OS << ".p2alignl "; break; 405 case 8: llvm_unreachable("Unsupported alignment size!"); 406 } 407 408 if (MAI.getAlignmentIsInBytes()) 409 OS << ByteAlignment; 410 else 411 OS << Log2_32(ByteAlignment); 412 413 if (Value || MaxBytesToEmit) { 414 OS << ", 0x"; 415 OS.write_hex(truncateToSize(Value, ValueSize)); 416 417 if (MaxBytesToEmit) 418 OS << ", " << MaxBytesToEmit; 419 } 420 EmitEOL(); 421 return; 422 } 423 424 // Non-power of two alignment. This is not widely supported by assemblers. 425 // FIXME: Parameterize this based on MAI. 426 switch (ValueSize) { 427 default: llvm_unreachable("Invalid size for machine code value!"); 428 case 1: OS << ".balign"; break; 429 case 2: OS << ".balignw"; break; 430 case 4: OS << ".balignl"; break; 431 case 8: llvm_unreachable("Unsupported alignment size!"); 432 } 433 434 OS << ' ' << ByteAlignment; 435 OS << ", " << truncateToSize(Value, ValueSize); 436 if (MaxBytesToEmit) 437 OS << ", " << MaxBytesToEmit; 438 EmitEOL(); 439} 440 441void MCAsmStreamer::EmitValueToOffset(const MCExpr *Offset, 442 unsigned char Value) { 443 // FIXME: Verify that Offset is associated with the current section. 444 OS << ".org " << *Offset << ", " << (unsigned) Value; 445 EmitEOL(); 446} 447 448void MCAsmStreamer::EmitInstruction(const MCInst &Inst) { 449 assert(CurSection && "Cannot emit contents before setting section!"); 450 451 // If we have an AsmPrinter, use that to print. 452 if (InstPrinter) { 453 InstPrinter->printInst(&Inst); 454 EmitEOL(); 455 456 // Show the encoding if we have a code emitter. 457 if (Emitter) { 458 SmallString<256> Code; 459 raw_svector_ostream VecOS(Code); 460 Emitter->EncodeInstruction(Inst, VecOS); 461 VecOS.flush(); 462 463 OS.indent(20); 464 OS << " # encoding: ["; 465 for (unsigned i = 0, e = Code.size(); i != e; ++i) { 466 if (i) 467 OS << ','; 468 OS << format("%#04x", uint8_t(Code[i])); 469 } 470 OS << "]\n"; 471 } 472 473 return; 474 } 475 476 // Otherwise fall back to a structural printing for now. Eventually we should 477 // always have access to the target specific printer. 478 Inst.print(OS, &MAI); 479 EmitEOL(); 480} 481 482void MCAsmStreamer::Finish() { 483 OS.flush(); 484} 485 486MCStreamer *llvm::createAsmStreamer(MCContext &Context, 487 formatted_raw_ostream &OS, 488 const MCAsmInfo &MAI, bool isLittleEndian, 489 bool isVerboseAsm, MCInstPrinter *IP, 490 MCCodeEmitter *CE) { 491 return new MCAsmStreamer(Context, OS, MAI, isLittleEndian, isVerboseAsm, 492 IP, CE); 493} 494