SemaStmtAsm.cpp revision ef3f6ff4ece061dc3e905d656126f09883c7ae2e
1//===--- SemaStmtAsm.cpp - Semantic Analysis for Asm Statements -----------===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9// 10// This file implements semantic analysis for inline asm statements. 11// 12//===----------------------------------------------------------------------===// 13 14#include "clang/Sema/SemaInternal.h" 15#include "clang/Sema/Scope.h" 16#include "clang/Sema/ScopeInfo.h" 17#include "clang/Sema/Initialization.h" 18#include "clang/Sema/Lookup.h" 19#include "clang/AST/TypeLoc.h" 20#include "clang/Lex/Preprocessor.h" 21#include "clang/Basic/TargetInfo.h" 22#include "llvm/ADT/ArrayRef.h" 23#include "llvm/ADT/BitVector.h" 24#include "llvm/ADT/SmallString.h" 25#include "llvm/MC/MCAsmInfo.h" 26#include "llvm/MC/MCContext.h" 27#include "llvm/MC/MCExpr.h" 28#include "llvm/MC/MCInst.h" 29#include "llvm/MC/MCInstPrinter.h" 30#include "llvm/MC/MCInstrInfo.h" 31#include "llvm/MC/MCObjectFileInfo.h" 32#include "llvm/MC/MCRegisterInfo.h" 33#include "llvm/MC/MCStreamer.h" 34#include "llvm/MC/MCSubtargetInfo.h" 35#include "llvm/MC/MCSymbol.h" 36#include "llvm/MC/MCTargetAsmParser.h" 37#include "llvm/MC/MCParser/MCAsmLexer.h" 38#include "llvm/MC/MCParser/MCAsmParser.h" 39#include "llvm/MC/MCParser/MCParsedAsmOperand.h" 40#include "llvm/Support/SourceMgr.h" 41#include "llvm/Support/TargetRegistry.h" 42#include "llvm/Support/TargetSelect.h" 43using namespace clang; 44using namespace sema; 45 46/// CheckAsmLValue - GNU C has an extremely ugly extension whereby they silently 47/// ignore "noop" casts in places where an lvalue is required by an inline asm. 48/// We emulate this behavior when -fheinous-gnu-extensions is specified, but 49/// provide a strong guidance to not use it. 50/// 51/// This method checks to see if the argument is an acceptable l-value and 52/// returns false if it is a case we can handle. 53static bool CheckAsmLValue(const Expr *E, Sema &S) { 54 // Type dependent expressions will be checked during instantiation. 55 if (E->isTypeDependent()) 56 return false; 57 58 if (E->isLValue()) 59 return false; // Cool, this is an lvalue. 60 61 // Okay, this is not an lvalue, but perhaps it is the result of a cast that we 62 // are supposed to allow. 63 const Expr *E2 = E->IgnoreParenNoopCasts(S.Context); 64 if (E != E2 && E2->isLValue()) { 65 if (!S.getLangOpts().HeinousExtensions) 66 S.Diag(E2->getLocStart(), diag::err_invalid_asm_cast_lvalue) 67 << E->getSourceRange(); 68 else 69 S.Diag(E2->getLocStart(), diag::warn_invalid_asm_cast_lvalue) 70 << E->getSourceRange(); 71 // Accept, even if we emitted an error diagnostic. 72 return false; 73 } 74 75 // None of the above, just randomly invalid non-lvalue. 76 return true; 77} 78 79/// isOperandMentioned - Return true if the specified operand # is mentioned 80/// anywhere in the decomposed asm string. 81static bool isOperandMentioned(unsigned OpNo, 82 ArrayRef<GCCAsmStmt::AsmStringPiece> AsmStrPieces) { 83 for (unsigned p = 0, e = AsmStrPieces.size(); p != e; ++p) { 84 const GCCAsmStmt::AsmStringPiece &Piece = AsmStrPieces[p]; 85 if (!Piece.isOperand()) continue; 86 87 // If this is a reference to the input and if the input was the smaller 88 // one, then we have to reject this asm. 89 if (Piece.getOperandNo() == OpNo) 90 return true; 91 } 92 return false; 93} 94 95StmtResult Sema::ActOnGCCAsmStmt(SourceLocation AsmLoc, bool IsSimple, 96 bool IsVolatile, unsigned NumOutputs, 97 unsigned NumInputs, IdentifierInfo **Names, 98 MultiExprArg constraints, MultiExprArg exprs, 99 Expr *asmString, MultiExprArg clobbers, 100 SourceLocation RParenLoc) { 101 unsigned NumClobbers = clobbers.size(); 102 StringLiteral **Constraints = 103 reinterpret_cast<StringLiteral**>(constraints.data()); 104 Expr **Exprs = exprs.data(); 105 StringLiteral *AsmString = cast<StringLiteral>(asmString); 106 StringLiteral **Clobbers = reinterpret_cast<StringLiteral**>(clobbers.data()); 107 108 SmallVector<TargetInfo::ConstraintInfo, 4> OutputConstraintInfos; 109 110 // The parser verifies that there is a string literal here. 111 if (!AsmString->isAscii()) 112 return StmtError(Diag(AsmString->getLocStart(),diag::err_asm_wide_character) 113 << AsmString->getSourceRange()); 114 115 for (unsigned i = 0; i != NumOutputs; i++) { 116 StringLiteral *Literal = Constraints[i]; 117 if (!Literal->isAscii()) 118 return StmtError(Diag(Literal->getLocStart(),diag::err_asm_wide_character) 119 << Literal->getSourceRange()); 120 121 StringRef OutputName; 122 if (Names[i]) 123 OutputName = Names[i]->getName(); 124 125 TargetInfo::ConstraintInfo Info(Literal->getString(), OutputName); 126 if (!Context.getTargetInfo().validateOutputConstraint(Info)) 127 return StmtError(Diag(Literal->getLocStart(), 128 diag::err_asm_invalid_output_constraint) 129 << Info.getConstraintStr()); 130 131 // Check that the output exprs are valid lvalues. 132 Expr *OutputExpr = Exprs[i]; 133 if (CheckAsmLValue(OutputExpr, *this)) { 134 return StmtError(Diag(OutputExpr->getLocStart(), 135 diag::err_asm_invalid_lvalue_in_output) 136 << OutputExpr->getSourceRange()); 137 } 138 139 OutputConstraintInfos.push_back(Info); 140 } 141 142 SmallVector<TargetInfo::ConstraintInfo, 4> InputConstraintInfos; 143 144 for (unsigned i = NumOutputs, e = NumOutputs + NumInputs; i != e; i++) { 145 StringLiteral *Literal = Constraints[i]; 146 if (!Literal->isAscii()) 147 return StmtError(Diag(Literal->getLocStart(),diag::err_asm_wide_character) 148 << Literal->getSourceRange()); 149 150 StringRef InputName; 151 if (Names[i]) 152 InputName = Names[i]->getName(); 153 154 TargetInfo::ConstraintInfo Info(Literal->getString(), InputName); 155 if (!Context.getTargetInfo().validateInputConstraint(OutputConstraintInfos.data(), 156 NumOutputs, Info)) { 157 return StmtError(Diag(Literal->getLocStart(), 158 diag::err_asm_invalid_input_constraint) 159 << Info.getConstraintStr()); 160 } 161 162 Expr *InputExpr = Exprs[i]; 163 164 // Only allow void types for memory constraints. 165 if (Info.allowsMemory() && !Info.allowsRegister()) { 166 if (CheckAsmLValue(InputExpr, *this)) 167 return StmtError(Diag(InputExpr->getLocStart(), 168 diag::err_asm_invalid_lvalue_in_input) 169 << Info.getConstraintStr() 170 << InputExpr->getSourceRange()); 171 } 172 173 if (Info.allowsRegister()) { 174 if (InputExpr->getType()->isVoidType()) { 175 return StmtError(Diag(InputExpr->getLocStart(), 176 diag::err_asm_invalid_type_in_input) 177 << InputExpr->getType() << Info.getConstraintStr() 178 << InputExpr->getSourceRange()); 179 } 180 } 181 182 ExprResult Result = DefaultFunctionArrayLvalueConversion(Exprs[i]); 183 if (Result.isInvalid()) 184 return StmtError(); 185 186 Exprs[i] = Result.take(); 187 InputConstraintInfos.push_back(Info); 188 } 189 190 // Check that the clobbers are valid. 191 for (unsigned i = 0; i != NumClobbers; i++) { 192 StringLiteral *Literal = Clobbers[i]; 193 if (!Literal->isAscii()) 194 return StmtError(Diag(Literal->getLocStart(),diag::err_asm_wide_character) 195 << Literal->getSourceRange()); 196 197 StringRef Clobber = Literal->getString(); 198 199 if (!Context.getTargetInfo().isValidClobber(Clobber)) 200 return StmtError(Diag(Literal->getLocStart(), 201 diag::err_asm_unknown_register_name) << Clobber); 202 } 203 204 GCCAsmStmt *NS = 205 new (Context) GCCAsmStmt(Context, AsmLoc, IsSimple, IsVolatile, NumOutputs, 206 NumInputs, Names, Constraints, Exprs, AsmString, 207 NumClobbers, Clobbers, RParenLoc); 208 // Validate the asm string, ensuring it makes sense given the operands we 209 // have. 210 SmallVector<GCCAsmStmt::AsmStringPiece, 8> Pieces; 211 unsigned DiagOffs; 212 if (unsigned DiagID = NS->AnalyzeAsmString(Pieces, Context, DiagOffs)) { 213 Diag(getLocationOfStringLiteralByte(AsmString, DiagOffs), DiagID) 214 << AsmString->getSourceRange(); 215 return StmtError(); 216 } 217 218 // Validate tied input operands for type mismatches. 219 for (unsigned i = 0, e = InputConstraintInfos.size(); i != e; ++i) { 220 TargetInfo::ConstraintInfo &Info = InputConstraintInfos[i]; 221 222 // If this is a tied constraint, verify that the output and input have 223 // either exactly the same type, or that they are int/ptr operands with the 224 // same size (int/long, int*/long, are ok etc). 225 if (!Info.hasTiedOperand()) continue; 226 227 unsigned TiedTo = Info.getTiedOperand(); 228 unsigned InputOpNo = i+NumOutputs; 229 Expr *OutputExpr = Exprs[TiedTo]; 230 Expr *InputExpr = Exprs[InputOpNo]; 231 232 if (OutputExpr->isTypeDependent() || InputExpr->isTypeDependent()) 233 continue; 234 235 QualType InTy = InputExpr->getType(); 236 QualType OutTy = OutputExpr->getType(); 237 if (Context.hasSameType(InTy, OutTy)) 238 continue; // All types can be tied to themselves. 239 240 // Decide if the input and output are in the same domain (integer/ptr or 241 // floating point. 242 enum AsmDomain { 243 AD_Int, AD_FP, AD_Other 244 } InputDomain, OutputDomain; 245 246 if (InTy->isIntegerType() || InTy->isPointerType()) 247 InputDomain = AD_Int; 248 else if (InTy->isRealFloatingType()) 249 InputDomain = AD_FP; 250 else 251 InputDomain = AD_Other; 252 253 if (OutTy->isIntegerType() || OutTy->isPointerType()) 254 OutputDomain = AD_Int; 255 else if (OutTy->isRealFloatingType()) 256 OutputDomain = AD_FP; 257 else 258 OutputDomain = AD_Other; 259 260 // They are ok if they are the same size and in the same domain. This 261 // allows tying things like: 262 // void* to int* 263 // void* to int if they are the same size. 264 // double to long double if they are the same size. 265 // 266 uint64_t OutSize = Context.getTypeSize(OutTy); 267 uint64_t InSize = Context.getTypeSize(InTy); 268 if (OutSize == InSize && InputDomain == OutputDomain && 269 InputDomain != AD_Other) 270 continue; 271 272 // If the smaller input/output operand is not mentioned in the asm string, 273 // then we can promote the smaller one to a larger input and the asm string 274 // won't notice. 275 bool SmallerValueMentioned = false; 276 277 // If this is a reference to the input and if the input was the smaller 278 // one, then we have to reject this asm. 279 if (isOperandMentioned(InputOpNo, Pieces)) { 280 // This is a use in the asm string of the smaller operand. Since we 281 // codegen this by promoting to a wider value, the asm will get printed 282 // "wrong". 283 SmallerValueMentioned |= InSize < OutSize; 284 } 285 if (isOperandMentioned(TiedTo, Pieces)) { 286 // If this is a reference to the output, and if the output is the larger 287 // value, then it's ok because we'll promote the input to the larger type. 288 SmallerValueMentioned |= OutSize < InSize; 289 } 290 291 // If the smaller value wasn't mentioned in the asm string, and if the 292 // output was a register, just extend the shorter one to the size of the 293 // larger one. 294 if (!SmallerValueMentioned && InputDomain != AD_Other && 295 OutputConstraintInfos[TiedTo].allowsRegister()) 296 continue; 297 298 // Either both of the operands were mentioned or the smaller one was 299 // mentioned. One more special case that we'll allow: if the tied input is 300 // integer, unmentioned, and is a constant, then we'll allow truncating it 301 // down to the size of the destination. 302 if (InputDomain == AD_Int && OutputDomain == AD_Int && 303 !isOperandMentioned(InputOpNo, Pieces) && 304 InputExpr->isEvaluatable(Context)) { 305 CastKind castKind = 306 (OutTy->isBooleanType() ? CK_IntegralToBoolean : CK_IntegralCast); 307 InputExpr = ImpCastExprToType(InputExpr, OutTy, castKind).take(); 308 Exprs[InputOpNo] = InputExpr; 309 NS->setInputExpr(i, InputExpr); 310 continue; 311 } 312 313 Diag(InputExpr->getLocStart(), 314 diag::err_asm_tying_incompatible_types) 315 << InTy << OutTy << OutputExpr->getSourceRange() 316 << InputExpr->getSourceRange(); 317 return StmtError(); 318 } 319 320 return Owned(NS); 321} 322 323// isMSAsmKeyword - Return true if this is an MS-style inline asm keyword. These 324// require special handling. 325static bool isMSAsmKeyword(StringRef Name) { 326 bool Ret = llvm::StringSwitch<bool>(Name) 327 .Cases("EVEN", "ALIGN", true) // Alignment directives. 328 .Cases("LENGTH", "SIZE", "TYPE", true) // Type and variable sizes. 329 .Case("_emit", true) // _emit Pseudoinstruction. 330 .Default(false); 331 return Ret; 332} 333 334// getIdentifierInfo - Given a Name and a range of tokens, find the associated 335// IdentifierInfo*. 336static IdentifierInfo *getIdentifierInfo(StringRef Name, 337 ArrayRef<Token> AsmToks, 338 unsigned Begin, unsigned End) { 339 for (unsigned i = Begin; i <= End; ++i) { 340 IdentifierInfo *II = AsmToks[i].getIdentifierInfo(); 341 if (II && II->getName() == Name) 342 return II; 343 } 344 return 0; 345} 346 347// getSpelling - Get the spelling of the AsmTok token. 348static StringRef getSpelling(Sema &SemaRef, Token AsmTok) { 349 StringRef Asm; 350 SmallString<512> TokenBuf; 351 TokenBuf.resize(512); 352 bool StringInvalid = false; 353 Asm = SemaRef.PP.getSpelling(AsmTok, TokenBuf, &StringInvalid); 354 assert (!StringInvalid && "Expected valid string!"); 355 return Asm; 356} 357 358// Determine if we should bail on this MSAsm instruction. 359static bool bailOnMSAsm(std::vector<StringRef> Piece) { 360 for (unsigned i = 0, e = Piece.size(); i != e; ++i) 361 if (isMSAsmKeyword(Piece[i])) 362 return true; 363 return false; 364} 365 366// Determine if we should bail on this MSAsm block. 367static bool bailOnMSAsm(std::vector<std::vector<StringRef> > Pieces) { 368 for (unsigned i = 0, e = Pieces.size(); i != e; ++i) 369 if (bailOnMSAsm(Pieces[i])) 370 return true; 371 return false; 372} 373 374// Determine if this is a simple MSAsm instruction. 375static bool isSimpleMSAsm(std::vector<StringRef> &Pieces, 376 const TargetInfo &TI) { 377 if (isMSAsmKeyword(Pieces[0])) 378 return false; 379 380 for (unsigned i = 1, e = Pieces.size(); i != e; ++i) 381 if (!TI.isValidGCCRegisterName(Pieces[i])) 382 return false; 383 return true; 384} 385 386// Determine if this is a simple MSAsm block. 387static bool isSimpleMSAsm(std::vector<std::vector<StringRef> > Pieces, 388 const TargetInfo &TI) { 389 for (unsigned i = 0, e = Pieces.size(); i != e; ++i) 390 if (!isSimpleMSAsm(Pieces[i], TI)) 391 return false; 392 return true; 393} 394 395// Break the AsmString into pieces (i.e., mnemonic and operands). 396static void buildMSAsmPieces(StringRef Asm, std::vector<StringRef> &Pieces) { 397 std::pair<StringRef,StringRef> Split = Asm.split(' '); 398 399 // Mnemonic 400 Pieces.push_back(Split.first); 401 Asm = Split.second; 402 403 // Operands 404 while (!Asm.empty()) { 405 Split = Asm.split(", "); 406 Pieces.push_back(Split.first); 407 Asm = Split.second; 408 } 409} 410 411static void buildMSAsmPieces(std::vector<std::string> &AsmStrings, 412 std::vector<std::vector<StringRef> > &Pieces) { 413 for (unsigned i = 0, e = AsmStrings.size(); i != e; ++i) 414 buildMSAsmPieces(AsmStrings[i], Pieces[i]); 415} 416 417// Build the individual assembly instruction(s) and place them in the AsmStrings 418// vector. These strings are fed to the AsmParser. Returns true on error. 419static bool buildMSAsmStrings(Sema &SemaRef, 420 SourceLocation AsmLoc, 421 ArrayRef<Token> AsmToks, 422 std::vector<std::string> &AsmStrings, 423 std::vector<std::pair<unsigned,unsigned> > &AsmTokRanges) { 424 assert (!AsmToks.empty() && "Didn't expect an empty AsmToks!"); 425 426 SmallString<512> Asm; 427 unsigned startTok = 0; 428 for (unsigned i = 0, e = AsmToks.size(); i < e; ++i) { 429 bool isNewAsm = ((i == 0) || 430 AsmToks[i].isAtStartOfLine() || 431 AsmToks[i].is(tok::kw_asm)); 432 433 if (isNewAsm) { 434 if (i) { 435 AsmStrings.push_back(Asm.str()); 436 AsmTokRanges.push_back(std::make_pair(startTok, i-1)); 437 startTok = i; 438 Asm.clear(); 439 } 440 if (AsmToks[i].is(tok::kw_asm)) { 441 i++; // Skip __asm 442 if (i == e) { 443 SemaRef.Diag(AsmLoc, diag::err_asm_empty); 444 return true; 445 } 446 } 447 } 448 449 if (i && AsmToks[i].hasLeadingSpace() && !isNewAsm) 450 Asm += ' '; 451 452 StringRef Spelling = getSpelling(SemaRef, AsmToks[i]); 453 Asm += Spelling; 454 } 455 AsmStrings.push_back(Asm.str()); 456 AsmTokRanges.push_back(std::make_pair(startTok, AsmToks.size()-1)); 457 458 return false; 459} 460 461// Check to see if the expression is a substring of the asm operand. 462static StringRef getMSInlineAsmExprName(StringRef Name) { 463 // Strip off the size directives. 464 // E.g., DWORD PTR [V] -> V 465 if (Name.startswith("BYTE") || Name.startswith("byte") || 466 Name.startswith("WORD") || Name.startswith("word") || 467 Name.startswith("DWORD") || Name.startswith("dword") || 468 Name.startswith("QWORD") || Name.startswith("qword") || 469 Name.startswith("XWORD") || Name.startswith("xword") || 470 Name.startswith("XMMWORD") || Name.startswith("xmmword") || 471 Name.startswith("YMMWORD") || Name.startswith("ymmword")) { 472 std::pair< StringRef, StringRef > SplitName = Name.split(' '); 473 assert((SplitName.second.startswith("PTR") || 474 SplitName.second.startswith("ptr")) && 475 "Expected PTR/ptr!"); 476 SplitName = SplitName.second.split('['); 477 SplitName = SplitName.second.split(']'); 478 return SplitName.first; 479 } 480 return Name; 481} 482 483#define DEF_SIMPLE_MSASM(STR) \ 484 MSAsmStmt *NS = \ 485 new (Context) MSAsmStmt(Context, AsmLoc, LBraceLoc, /*IsSimple*/ true, \ 486 /*IsVolatile*/ true, AsmToks, Inputs, Outputs, \ 487 InputExprs, OutputExprs, STR, Constraints, \ 488 Clobbers, EndLoc); 489 490StmtResult Sema::ActOnMSAsmStmt(SourceLocation AsmLoc, SourceLocation LBraceLoc, 491 ArrayRef<Token> AsmToks,SourceLocation EndLoc) { 492 SmallVector<StringRef, 4> Constraints; 493 std::vector<std::string> InputConstraints; 494 std::vector<std::string> OutputConstraints; 495 SmallVector<StringRef, 4> Clobbers; 496 std::set<std::string> ClobberRegs; 497 498 // FIXME: Use a struct to hold the various expression information. 499 SmallVector<IdentifierInfo*, 4> Inputs; 500 SmallVector<IdentifierInfo*, 4> Outputs; 501 SmallVector<Expr*, 4> InputExprs; 502 SmallVector<Expr*, 4> OutputExprs; 503 SmallVector<std::string, 4> InputExprNames; 504 SmallVector<std::string, 4> OutputExprNames; 505 SmallVector<unsigned, 4> InputExprStrIdx; 506 SmallVector<unsigned, 4> OutputExprStrIdx; 507 508 // Empty asm statements don't need to instantiate the AsmParser, etc. 509 StringRef EmptyAsmStr; 510 if (AsmToks.empty()) { DEF_SIMPLE_MSASM(EmptyAsmStr); return Owned(NS); } 511 512 std::vector<std::string> AsmStrings; 513 std::vector<std::pair<unsigned,unsigned> > AsmTokRanges; 514 if (buildMSAsmStrings(*this, AsmLoc, AsmToks, AsmStrings, AsmTokRanges)) 515 return StmtError(); 516 517 std::vector<std::vector<StringRef> > Pieces(AsmStrings.size()); 518 buildMSAsmPieces(AsmStrings, Pieces); 519 520 bool IsSimple = isSimpleMSAsm(Pieces, Context.getTargetInfo()); 521 522 // AsmParser doesn't fully support these asm statements. 523 if (bailOnMSAsm(Pieces)) { DEF_SIMPLE_MSASM(EmptyAsmStr); return Owned(NS); } 524 525 // Get the target specific parser. 526 std::string Error; 527 const std::string &TT = Context.getTargetInfo().getTriple().getTriple(); 528 const llvm::Target *TheTarget(llvm::TargetRegistry::lookupTarget(TT, Error)); 529 530 OwningPtr<llvm::MCAsmInfo> MAI(TheTarget->createMCAsmInfo(TT)); 531 OwningPtr<llvm::MCRegisterInfo> MRI(TheTarget->createMCRegInfo(TT)); 532 OwningPtr<llvm::MCObjectFileInfo> MOFI(new llvm::MCObjectFileInfo()); 533 OwningPtr<llvm::MCSubtargetInfo> 534 STI(TheTarget->createMCSubtargetInfo(TT, "", "")); 535 536 for (unsigned StrIdx = 0, e = AsmStrings.size(); StrIdx != e; ++StrIdx) { 537 llvm::SourceMgr SrcMgr; 538 llvm::MCContext Ctx(*MAI, *MRI, MOFI.get(), &SrcMgr); 539 llvm::MemoryBuffer *Buffer = 540 llvm::MemoryBuffer::getMemBuffer(AsmStrings[StrIdx], "<inline asm>"); 541 542 // Tell SrcMgr about this buffer, which is what the parser will pick up. 543 SrcMgr.AddNewSourceBuffer(Buffer, llvm::SMLoc()); 544 545 OwningPtr<llvm::MCStreamer> Str(createNullStreamer(Ctx)); 546 OwningPtr<llvm::MCAsmParser> 547 Parser(createMCAsmParser(SrcMgr, Ctx, *Str.get(), *MAI)); 548 OwningPtr<llvm::MCTargetAsmParser> 549 TargetParser(TheTarget->createMCAsmParser(*STI, *Parser)); 550 // Change to the Intel dialect. 551 Parser->setAssemblerDialect(1); 552 Parser->setTargetParser(*TargetParser.get()); 553 554 // Prime the lexer. 555 Parser->Lex(); 556 557 // Parse the opcode. 558 StringRef IDVal; 559 Parser->ParseIdentifier(IDVal); 560 561 // Canonicalize the opcode to lower case. 562 SmallString<128> OpcodeStr; 563 for (unsigned i = 0, e = IDVal.size(); i != e; ++i) 564 OpcodeStr.push_back(tolower(IDVal[i])); 565 // FIXME: Convert to a StmtError. 566 assert(TargetParser->mnemonicIsValid(OpcodeStr) && "Invalid mnemonic!"); 567 568 // Parse the operands. 569 llvm::SMLoc IDLoc; 570 SmallVector<llvm::MCParsedAsmOperand*, 8> Operands; 571 bool HadError = TargetParser->ParseInstruction(OpcodeStr.str(), IDLoc, 572 Operands); 573 // If we had an error parsing the operands, fail gracefully. 574 if (HadError) { DEF_SIMPLE_MSASM(EmptyAsmStr); return Owned(NS); } 575 576 // Match the MCInstr. 577 unsigned Kind; 578 unsigned Opcode; 579 unsigned ErrorInfo; 580 SmallVector<std::pair< unsigned, std::string >, 4> MapAndConstraints; 581 HadError = TargetParser->MatchInstruction(IDLoc, Operands, *Str.get(), Kind, 582 Opcode, MapAndConstraints, 583 ErrorInfo, 584 /*matchingInlineAsm*/ true); 585 // If we had an error parsing the operands, fail gracefully. 586 if (HadError) { DEF_SIMPLE_MSASM(EmptyAsmStr); return Owned(NS); } 587 588 // Get the instruction descriptor. 589 const llvm::MCInstrInfo *MII = TheTarget->createMCInstrInfo(); 590 const llvm::MCInstrDesc &Desc = MII->get(Opcode); 591 llvm::MCInstPrinter *IP = 592 TheTarget->createMCInstPrinter(1, *MAI, *MII, *MRI, *STI); 593 594 // Build the list of clobbers, outputs and inputs. 595 unsigned NumDefs = Desc.getNumDefs(); 596 for (unsigned i = 1, e = Operands.size(); i != e; ++i) { 597 // Skip immediates. 598 if (Operands[i]->isImm()) 599 continue; 600 601 // Register. 602 if (Operands[i]->isReg()) { 603 // Clobber. 604 if (NumDefs && (MapAndConstraints[i-1].first < NumDefs)) { 605 std::string Reg; 606 llvm::raw_string_ostream OS(Reg); 607 IP->printRegName(OS, Operands[i]->getReg()); 608 StringRef Clobber(OS.str()); 609 if (!Context.getTargetInfo().isValidClobber(Clobber)) 610 return StmtError( 611 Diag(AsmLoc, diag::err_asm_unknown_register_name) << Clobber); 612 ClobberRegs.insert(Reg); 613 } 614 continue; 615 } 616 617 // Expr/Input or Output. 618 StringRef Name = getMSInlineAsmExprName(Pieces[StrIdx][i]); 619 620 // The expr may be a register. 621 // E.g., DWORD PTR [eax] 622 if (Context.getTargetInfo().isValidGCCRegisterName(Name)) 623 continue; 624 625 IdentifierInfo *II = getIdentifierInfo(Name, AsmToks, 626 AsmTokRanges[StrIdx].first, 627 AsmTokRanges[StrIdx].second); 628 if (II) { 629 CXXScopeSpec SS; 630 UnqualifiedId Id; 631 SourceLocation Loc; 632 Id.setIdentifier(II, AsmLoc); 633 ExprResult Result = ActOnIdExpression(getCurScope(), SS, Loc, Id, 634 false, false); 635 if (!Result.isInvalid()) { 636 // FIXME: Determine the proper constraints. 637 bool isMemDef = (i == 1) && Desc.mayStore(); 638 if (isMemDef) { 639 Outputs.push_back(II); 640 OutputExprs.push_back(Result.take()); 641 OutputExprNames.push_back(Name.str()); 642 OutputExprStrIdx.push_back(StrIdx); 643 644 std::string Constraint = "=" + MapAndConstraints[i-1].second; 645 OutputConstraints.push_back(Constraint); 646 } else { 647 Inputs.push_back(II); 648 InputExprs.push_back(Result.take()); 649 InputExprNames.push_back(Name.str()); 650 InputExprStrIdx.push_back(StrIdx); 651 InputConstraints.push_back(MapAndConstraints[i-1].second); 652 } 653 } 654 } 655 } 656 } 657 for (std::set<std::string>::iterator I = ClobberRegs.begin(), 658 E = ClobberRegs.end(); I != E; ++I) 659 Clobbers.push_back(*I); 660 661 // Merge the output and input constraints. Output constraints are expected 662 // first. 663 for (std::vector<std::string>::iterator I = OutputConstraints.begin(), 664 E = OutputConstraints.end(); I != E; ++I) 665 Constraints.push_back(*I); 666 667 for (std::vector<std::string>::iterator I = InputConstraints.begin(), 668 E = InputConstraints.end(); I != E; ++I) 669 Constraints.push_back(*I); 670 671 // Enumerate the AsmString expressions. 672 unsigned OpNum = 0; 673 for (unsigned i = 0, e = OutputExprNames.size(); i != e; ++i, ++OpNum) { 674 unsigned StrIdx = OutputExprStrIdx[i]; 675 // Iterate over the assembly instruction pieces, skipping the mnemonic. 676 for (unsigned j = 1, f = Pieces[StrIdx].size(); j != f; ++j) { 677 // If the operand and the expression name match, then rewrite the operand. 678 if (OutputExprNames[i] == Pieces[StrIdx][j]) { 679 SmallString<32> Res; 680 llvm::raw_svector_ostream OS(Res); 681 OS << '$' << OpNum; 682 OutputExprNames[i] = OS.str(); 683 Pieces[StrIdx][j] = OutputExprNames[i]; 684 break; 685 } 686 // Check to see if the expression is a substring of the asm piece. 687 std::pair< StringRef, StringRef > Split = Pieces[StrIdx][j].split(' '); 688 bool isKeyword = llvm::StringSwitch<bool>(Split.first) 689 .Cases("BYTE", "byte", "WORD", "word", "DWORD", true) 690 .Cases("dword", "QWORD", "qword", "XWORD", "xword", true) 691 .Cases("XMMWORD", "xmmword", "YMMWORD", "ymmword", true) 692 .Default(false); 693 if (isKeyword && 694 Split.second.find_first_of(OutputExprNames[i]) != StringRef::npos) { 695 // Is is a substring, do the replacement. 696 SmallString<32> Res; 697 llvm::raw_svector_ostream OS(Res); 698 OS << '$' << OpNum; 699 std::string piece = Pieces[StrIdx][j].str(); 700 size_t found = piece.find(InputExprNames[i]); 701 piece.replace(found, InputExprNames[i].size(), OS.str()); 702 OutputExprNames[i] = piece; 703 Pieces[StrIdx][j] = OutputExprNames[i]; 704 break; 705 } 706 } 707 } 708 for (unsigned i = 0, e = InputExprNames.size(); i != e; ++i, ++OpNum) { 709 unsigned StrIdx = InputExprStrIdx[i]; 710 // Iterate over the assembly instruction pieces, skipping the mnemonic. 711 for (unsigned j = 1, f = Pieces[StrIdx].size(); j != f; ++j) { 712 // If the operand and the expression name match, then rewrite the operand. 713 if (InputExprNames[i] == Pieces[StrIdx][j]) { 714 SmallString<32> Res; 715 llvm::raw_svector_ostream OS(Res); 716 OS << '$' << OpNum; 717 InputExprNames[i] = OS.str(); 718 Pieces[StrIdx][j] = InputExprNames[i]; 719 break; 720 } 721 // Check to see if the expression is a substring of the asm piece. 722 std::pair< StringRef, StringRef > Split = Pieces[StrIdx][j].split(' '); 723 bool isKeyword = llvm::StringSwitch<bool>(Split.first) 724 .Cases("BYTE", "byte", "WORD", "word", "DWORD", true) 725 .Cases("dword", "QWORD", "qword", "XWORD", "xword", true) 726 .Cases("XMMWORD", "xmmword", "YMMWORD", "ymmword", true) 727 .Default(false); 728 if (isKeyword && 729 Split.second.find_first_of(InputExprNames[i]) != StringRef::npos) { 730 // It is a substring, do the replacement. 731 SmallString<32> Res; 732 llvm::raw_svector_ostream OS(Res); 733 OS << '$' << OpNum; 734 std::string piece = Pieces[StrIdx][j].str(); 735 size_t found = piece.find(InputExprNames[i]); 736 piece.replace(found, InputExprNames[i].size(), OS.str()); 737 InputExprNames[i] = piece; 738 Pieces[StrIdx][j] = InputExprNames[i]; 739 break; 740 } 741 } 742 } 743 744 // Emit the IR assembly string. 745 std::string AsmString; 746 for (unsigned i = 0, e = Pieces.size(); i != e; ++i) { 747 // Skip empty asm stmts. 748 if (Pieces[i].empty()) continue; 749 750 if (i > 0) 751 AsmString += "\n\t"; 752 753 // Emit the mnemonic. 754 AsmString += Pieces[i][0]; 755 if (Pieces[i].size() > 1) 756 AsmString += ' '; 757 758 // Emit the operands adding $$ to constants. 759 for (unsigned j = 1, f = Pieces[i].size(); j != f; ++j) { 760 if (j > 1) AsmString += ", "; 761 unsigned Val; 762 if (!Pieces[i][j].getAsInteger(0, Val)) 763 AsmString += "$$"; 764 765 AsmString += Pieces[i][j]; 766 } 767 } 768 769 MSAsmStmt *NS = 770 new (Context) MSAsmStmt(Context, AsmLoc, LBraceLoc, IsSimple, 771 /*IsVolatile*/ true, AsmToks, Inputs, Outputs, 772 InputExprs, OutputExprs, AsmString, Constraints, 773 Clobbers, EndLoc); 774 return Owned(NS); 775} 776