blob: 94223e43845c1c7ad73a7ae5fa3f1971607d6dd2 [file] [log] [blame]
Chad Rosier3d45a772012-08-17 21:27:25 +00001//===--- SemaStmtAsm.cpp - Semantic Analysis for Asm Statements -----------===//
Chad Rosier4b5e48d2012-08-17 21:19:40 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements semantic analysis for inline asm statements.
11//
12//===----------------------------------------------------------------------===//
13
#include "clang/Sema/SemaInternal.h"
#include "clang/Sema/Scope.h"
#include "clang/Sema/ScopeInfo.h"
#include "clang/Sema/Initialization.h"
#include "clang/Sema/Lookup.h"
#include "clang/AST/TypeLoc.h"
#include "clang/Lex/Preprocessor.h"
#include "clang/Basic/TargetInfo.h"
#include "llvm/ADT/ArrayRef.h"
#include "llvm/ADT/BitVector.h"
#include "llvm/ADT/SmallString.h"
#include "llvm/MC/MCAsmInfo.h"
#include "llvm/MC/MCContext.h"
#include "llvm/MC/MCInst.h"
#include "llvm/MC/MCInstPrinter.h"
#include "llvm/MC/MCInstrInfo.h"
#include "llvm/MC/MCObjectFileInfo.h"
#include "llvm/MC/MCRegisterInfo.h"
#include "llvm/MC/MCStreamer.h"
#include "llvm/MC/MCSubtargetInfo.h"
#include "llvm/MC/MCTargetAsmParser.h"
#include "llvm/MC/MCParser/MCAsmLexer.h"
#include "llvm/MC/MCParser/MCAsmParser.h"
#include "llvm/MC/MCParser/MCParsedAsmOperand.h"
#include "llvm/Support/SourceMgr.h"
#include "llvm/Support/TargetRegistry.h"
#include "llvm/Support/TargetSelect.h"
40using namespace clang;
41using namespace sema;
42
43/// CheckAsmLValue - GNU C has an extremely ugly extension whereby they silently
44/// ignore "noop" casts in places where an lvalue is required by an inline asm.
45/// We emulate this behavior when -fheinous-gnu-extensions is specified, but
46/// provide a strong guidance to not use it.
47///
48/// This method checks to see if the argument is an acceptable l-value and
49/// returns false if it is a case we can handle.
50static bool CheckAsmLValue(const Expr *E, Sema &S) {
51 // Type dependent expressions will be checked during instantiation.
52 if (E->isTypeDependent())
53 return false;
54
55 if (E->isLValue())
56 return false; // Cool, this is an lvalue.
57
58 // Okay, this is not an lvalue, but perhaps it is the result of a cast that we
59 // are supposed to allow.
60 const Expr *E2 = E->IgnoreParenNoopCasts(S.Context);
61 if (E != E2 && E2->isLValue()) {
62 if (!S.getLangOpts().HeinousExtensions)
63 S.Diag(E2->getLocStart(), diag::err_invalid_asm_cast_lvalue)
64 << E->getSourceRange();
65 else
66 S.Diag(E2->getLocStart(), diag::warn_invalid_asm_cast_lvalue)
67 << E->getSourceRange();
68 // Accept, even if we emitted an error diagnostic.
69 return false;
70 }
71
72 // None of the above, just randomly invalid non-lvalue.
73 return true;
74}
75
76/// isOperandMentioned - Return true if the specified operand # is mentioned
77/// anywhere in the decomposed asm string.
78static bool isOperandMentioned(unsigned OpNo,
79 ArrayRef<AsmStmt::AsmStringPiece> AsmStrPieces) {
80 for (unsigned p = 0, e = AsmStrPieces.size(); p != e; ++p) {
81 const AsmStmt::AsmStringPiece &Piece = AsmStrPieces[p];
82 if (!Piece.isOperand()) continue;
83
84 // If this is a reference to the input and if the input was the smaller
85 // one, then we have to reject this asm.
86 if (Piece.getOperandNo() == OpNo)
87 return true;
88 }
89 return false;
90}
91
/// ActOnAsmStmt - Semantic analysis for a GNU-style inline asm statement.
///
/// \p Names, \p constraints and \p exprs are parallel arrays: entries
/// [0, NumOutputs) describe the output operands and entries
/// [NumOutputs, NumOutputs + NumInputs) describe the input operands.
///
/// The checks performed, in order, are:
///   - the asm string, every constraint and every clobber is an ASCII string;
///   - each output constraint is accepted by the target and each output
///     expression passes CheckAsmLValue;
///   - each input constraint is accepted by the target, memory-only inputs
///     pass CheckAsmLValue, and register inputs are not of void type;
///   - each clobber is a valid clobber for the target;
///   - the asm string itself analyzes cleanly against the operands;
///   - tied input/output operand pairs have compatible types.
///
/// Input expressions are replaced in place in \p exprs by the result of
/// DefaultFunctionArrayLvalueConversion (and, for some tied constants, by an
/// implicit cast to the output type).
///
/// Returns the new AsmStmt on success, or StmtError() after emitting a
/// diagnostic (or when a conversion fails) otherwise.
StmtResult Sema::ActOnAsmStmt(SourceLocation AsmLoc, bool IsSimple,
                              bool IsVolatile, unsigned NumOutputs,
                              unsigned NumInputs, IdentifierInfo **Names,
                              MultiExprArg constraints, MultiExprArg exprs,
                              Expr *asmString, MultiExprArg clobbers,
                              SourceLocation RParenLoc) {
  unsigned NumClobbers = clobbers.size();
  // The constraint and clobber arrays are handed over as expressions; they are
  // reinterpreted here as arrays of string literals.
  StringLiteral **Constraints =
    reinterpret_cast<StringLiteral**>(constraints.get());
  Expr **Exprs = exprs.get();
  StringLiteral *AsmString = cast<StringLiteral>(asmString);
  StringLiteral **Clobbers = reinterpret_cast<StringLiteral**>(clobbers.get());

  SmallVector<TargetInfo::ConstraintInfo, 4> OutputConstraintInfos;

  // The parser verifies that there is a string literal here.
  if (!AsmString->isAscii())
    return StmtError(Diag(AsmString->getLocStart(),diag::err_asm_wide_character)
      << AsmString->getSourceRange());

  // Validate the output operands.
  for (unsigned i = 0; i != NumOutputs; i++) {
    StringLiteral *Literal = Constraints[i];
    if (!Literal->isAscii())
      return StmtError(Diag(Literal->getLocStart(),diag::err_asm_wide_character)
        << Literal->getSourceRange());

    // Operands may be unnamed, in which case the name stays empty.
    StringRef OutputName;
    if (Names[i])
      OutputName = Names[i]->getName();

    TargetInfo::ConstraintInfo Info(Literal->getString(), OutputName);
    if (!Context.getTargetInfo().validateOutputConstraint(Info))
      return StmtError(Diag(Literal->getLocStart(),
                            diag::err_asm_invalid_output_constraint)
                       << Info.getConstraintStr());

    // Check that the output exprs are valid lvalues.
    Expr *OutputExpr = Exprs[i];
    if (CheckAsmLValue(OutputExpr, *this)) {
      return StmtError(Diag(OutputExpr->getLocStart(),
                  diag::err_asm_invalid_lvalue_in_output)
        << OutputExpr->getSourceRange());
    }

    OutputConstraintInfos.push_back(Info);
  }

  SmallVector<TargetInfo::ConstraintInfo, 4> InputConstraintInfos;

  // Validate the input operands, which follow the outputs in the arrays.
  for (unsigned i = NumOutputs, e = NumOutputs + NumInputs; i != e; i++) {
    StringLiteral *Literal = Constraints[i];
    if (!Literal->isAscii())
      return StmtError(Diag(Literal->getLocStart(),diag::err_asm_wide_character)
        << Literal->getSourceRange());

    StringRef InputName;
    if (Names[i])
      InputName = Names[i]->getName();

    // Input constraints are validated against the already-validated outputs.
    TargetInfo::ConstraintInfo Info(Literal->getString(), InputName);
    if (!Context.getTargetInfo().validateInputConstraint(OutputConstraintInfos.data(),
                                                NumOutputs, Info)) {
      return StmtError(Diag(Literal->getLocStart(),
                            diag::err_asm_invalid_input_constraint)
                       << Info.getConstraintStr());
    }

    Expr *InputExpr = Exprs[i];

    // An input that may only live in memory must pass the l-value check.
    if (Info.allowsMemory() && !Info.allowsRegister()) {
      if (CheckAsmLValue(InputExpr, *this))
        return StmtError(Diag(InputExpr->getLocStart(),
                              diag::err_asm_invalid_lvalue_in_input)
                         << Info.getConstraintStr()
                         << InputExpr->getSourceRange());
    }

    // An input that may live in a register must not have void type.
    if (Info.allowsRegister()) {
      if (InputExpr->getType()->isVoidType()) {
        return StmtError(Diag(InputExpr->getLocStart(),
                              diag::err_asm_invalid_type_in_input)
          << InputExpr->getType() << Info.getConstraintStr()
          << InputExpr->getSourceRange());
      }
    }

    // Apply the default conversions and store the converted expression back
    // into the operand array.
    ExprResult Result = DefaultFunctionArrayLvalueConversion(Exprs[i]);
    if (Result.isInvalid())
      return StmtError();

    Exprs[i] = Result.take();
    InputConstraintInfos.push_back(Info);
  }

  // Check that the clobbers are valid.
  for (unsigned i = 0; i != NumClobbers; i++) {
    StringLiteral *Literal = Clobbers[i];
    if (!Literal->isAscii())
      return StmtError(Diag(Literal->getLocStart(),diag::err_asm_wide_character)
        << Literal->getSourceRange());

    StringRef Clobber = Literal->getString();

    if (!Context.getTargetInfo().isValidClobber(Clobber))
      return StmtError(Diag(Literal->getLocStart(),
                  diag::err_asm_unknown_register_name) << Clobber);
  }

  // The statement is built before the remaining checks because they need it:
  // AnalyzeAsmString is a member, and a tied input may be replaced below.
  AsmStmt *NS =
    new (Context) AsmStmt(Context, AsmLoc, IsSimple, IsVolatile, NumOutputs,
                          NumInputs, Names, Constraints, Exprs, AsmString,
                          NumClobbers, Clobbers, RParenLoc);
  // Validate the asm string, ensuring it makes sense given the operands we
  // have.
  SmallVector<AsmStmt::AsmStringPiece, 8> Pieces;
  unsigned DiagOffs;
  if (unsigned DiagID = NS->AnalyzeAsmString(Pieces, Context, DiagOffs)) {
    Diag(getLocationOfStringLiteralByte(AsmString, DiagOffs), DiagID)
           << AsmString->getSourceRange();
    return StmtError();
  }

  // Validate tied input operands for type mismatches.
  for (unsigned i = 0, e = InputConstraintInfos.size(); i != e; ++i) {
    TargetInfo::ConstraintInfo &Info = InputConstraintInfos[i];

    // If this is a tied constraint, verify that the output and input have
    // either exactly the same type, or that they are int/ptr operands with the
    // same size (int/long, int*/long, are ok etc).
    if (!Info.hasTiedOperand()) continue;

    // i indexes the inputs only; InputOpNo is the operand's position in the
    // combined output+input arrays.
    unsigned TiedTo = Info.getTiedOperand();
    unsigned InputOpNo = i+NumOutputs;
    Expr *OutputExpr = Exprs[TiedTo];
    Expr *InputExpr = Exprs[InputOpNo];

    // Type-dependent operands are skipped here.
    if (OutputExpr->isTypeDependent() || InputExpr->isTypeDependent())
      continue;

    QualType InTy = InputExpr->getType();
    QualType OutTy = OutputExpr->getType();
    if (Context.hasSameType(InTy, OutTy))
      continue;  // All types can be tied to themselves.

    // Decide if the input and output are in the same domain (integer/ptr or
    // floating point).
    enum AsmDomain {
      AD_Int, AD_FP, AD_Other
    } InputDomain, OutputDomain;

    if (InTy->isIntegerType() || InTy->isPointerType())
      InputDomain = AD_Int;
    else if (InTy->isRealFloatingType())
      InputDomain = AD_FP;
    else
      InputDomain = AD_Other;

    if (OutTy->isIntegerType() || OutTy->isPointerType())
      OutputDomain = AD_Int;
    else if (OutTy->isRealFloatingType())
      OutputDomain = AD_FP;
    else
      OutputDomain = AD_Other;

    // They are ok if they are the same size and in the same domain.  This
    // allows tying things like:
    //   void* to int*
    //   void* to int            if they are the same size.
    //   double to long double   if they are the same size.
    //
    uint64_t OutSize = Context.getTypeSize(OutTy);
    uint64_t InSize = Context.getTypeSize(InTy);
    if (OutSize == InSize && InputDomain == OutputDomain &&
        InputDomain != AD_Other)
      continue;

    // If the smaller input/output operand is not mentioned in the asm string,
    // then we can promote the smaller one to a larger input and the asm string
    // won't notice.
    bool SmallerValueMentioned = false;

    // If this is a reference to the input and if the input was the smaller
    // one, then we have to reject this asm.
    if (isOperandMentioned(InputOpNo, Pieces)) {
      // This is a use in the asm string of the smaller operand.  Since we
      // codegen this by promoting to a wider value, the asm will get printed
      // "wrong".
      SmallerValueMentioned |= InSize < OutSize;
    }
    if (isOperandMentioned(TiedTo, Pieces)) {
      // If this is a reference to the output, and if the output is the larger
      // value, then it's ok because we'll promote the input to the larger type.
      SmallerValueMentioned |= OutSize < InSize;
    }

    // If the smaller value wasn't mentioned in the asm string, and if the
    // output was a register, just extend the shorter one to the size of the
    // larger one.
    if (!SmallerValueMentioned && InputDomain != AD_Other &&
        OutputConstraintInfos[TiedTo].allowsRegister())
      continue;

    // Either both of the operands were mentioned or the smaller one was
    // mentioned.  One more special case that we'll allow: if the tied input is
    // integer, unmentioned, and is a constant, then we'll allow truncating it
    // down to the size of the destination.
    if (InputDomain == AD_Int && OutputDomain == AD_Int &&
        !isOperandMentioned(InputOpNo, Pieces) &&
        InputExpr->isEvaluatable(Context)) {
      CastKind castKind =
        (OutTy->isBooleanType() ? CK_IntegralToBoolean : CK_IntegralCast);
      InputExpr = ImpCastExprToType(InputExpr, OutTy, castKind).take();
      // Keep both the operand array and the already-built statement in sync
      // with the newly cast input.
      Exprs[InputOpNo] = InputExpr;
      NS->setInputExpr(i, InputExpr);
      continue;
    }

    // No special case applied: the tied operands are incompatible.
    Diag(InputExpr->getLocStart(),
         diag::err_asm_tying_incompatible_types)
      << InTy << OutTy << OutputExpr->getSourceRange()
      << InputExpr->getSourceRange();
    return StmtError();
  }

  return Owned(NS);
}
319
320// isMSAsmKeyword - Return true if this is an MS-style inline asm keyword. These
321// require special handling.
322static bool isMSAsmKeyword(StringRef Name) {
323 bool Ret = llvm::StringSwitch<bool>(Name)
324 .Cases("EVEN", "ALIGN", true) // Alignment directives.
325 .Cases("LENGTH", "SIZE", "TYPE", true) // Type and variable sizes.
326 .Case("_emit", true) // _emit Pseudoinstruction.
327 .Default(false);
328 return Ret;
329}
330
331static StringRef getSpelling(Sema &SemaRef, Token AsmTok) {
332 StringRef Asm;
333 SmallString<512> TokenBuf;
334 TokenBuf.resize(512);
335 bool StringInvalid = false;
336 Asm = SemaRef.PP.getSpelling(AsmTok, TokenBuf, &StringInvalid);
337 assert (!StringInvalid && "Expected valid string!");
338 return Asm;
339}
340
341static void patchMSAsmStrings(Sema &SemaRef, bool &IsSimple,
342 SourceLocation AsmLoc,
343 ArrayRef<Token> AsmToks,
344 const TargetInfo &TI,
345 std::vector<llvm::BitVector> &AsmRegs,
346 std::vector<llvm::BitVector> &AsmNames,
347 std::vector<std::string> &AsmStrings) {
348 assert (!AsmToks.empty() && "Didn't expect an empty AsmToks!");
349
350 // Assume simple asm stmt until we parse a non-register identifer (or we just
351 // need to bail gracefully).
352 IsSimple = true;
353
354 SmallString<512> Asm;
355 unsigned NumAsmStrings = 0;
356 for (unsigned i = 0, e = AsmToks.size(); i != e; ++i) {
357
358 // Determine if this should be considered a new asm.
359 bool isNewAsm = i == 0 || AsmToks[i].isAtStartOfLine() ||
360 AsmToks[i].is(tok::kw_asm);
361
362 // Emit the previous asm string.
363 if (i && isNewAsm) {
364 AsmStrings[NumAsmStrings++] = Asm.c_str();
365 if (AsmToks[i].is(tok::kw_asm)) {
366 ++i; // Skip __asm
367 assert (i != e && "Expected another token.");
368 }
369 }
370
371 // Start a new asm string with the opcode.
372 if (isNewAsm) {
373 AsmRegs[NumAsmStrings].resize(AsmToks.size());
374 AsmNames[NumAsmStrings].resize(AsmToks.size());
375
376 StringRef Piece = AsmToks[i].getIdentifierInfo()->getName();
377 // MS-style inline asm keywords require special handling.
378 if (isMSAsmKeyword(Piece))
379 IsSimple = false;
380
381 // TODO: Verify this is a valid opcode.
382 Asm = Piece;
383 continue;
384 }
385
386 if (i && AsmToks[i].hasLeadingSpace())
387 Asm += ' ';
388
389 // Check the operand(s).
390 switch (AsmToks[i].getKind()) {
391 default:
392 IsSimple = false;
393 Asm += getSpelling(SemaRef, AsmToks[i]);
394 break;
395 case tok::comma: Asm += ","; break;
396 case tok::colon: Asm += ":"; break;
397 case tok::l_square: Asm += "["; break;
398 case tok::r_square: Asm += "]"; break;
399 case tok::l_brace: Asm += "{"; break;
400 case tok::r_brace: Asm += "}"; break;
401 case tok::numeric_constant:
402 Asm += getSpelling(SemaRef, AsmToks[i]);
403 break;
404 case tok::identifier: {
405 IdentifierInfo *II = AsmToks[i].getIdentifierInfo();
406 StringRef Name = II->getName();
407
408 // Valid register?
409 if (TI.isValidGCCRegisterName(Name)) {
410 AsmRegs[NumAsmStrings].set(i);
411 Asm += Name;
412 break;
413 }
414
415 IsSimple = false;
416
417 // MS-style inline asm keywords require special handling.
418 if (isMSAsmKeyword(Name)) {
419 IsSimple = false;
420 Asm += Name;
421 break;
422 }
423
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000424 // Lookup the identifier.
425 // TODO: Someone with more experience with clang should verify this the
426 // proper way of doing a symbol lookup.
427 DeclarationName DeclName(II);
428 Scope *CurScope = SemaRef.getCurScope();
429 LookupResult R(SemaRef, DeclName, AsmLoc, Sema::LookupOrdinaryName);
430 if (!SemaRef.LookupName(R, CurScope, false/*AllowBuiltinCreation*/))
431 break;
432
433 assert (R.isSingleResult() && "Expected a single result?!");
434 NamedDecl *Decl = R.getFoundDecl();
435 switch (Decl->getKind()) {
436 default:
437 assert(0 && "Unknown decl kind.");
438 break;
439 case Decl::Var: {
440 case Decl::ParmVar:
441 AsmNames[NumAsmStrings].set(i);
442
443 VarDecl *Var = cast<VarDecl>(Decl);
444 QualType Ty = Var->getType();
445 (void)Ty; // Avoid warning.
446 // TODO: Patch identifier with valid operand. One potential idea is to
447 // probe the backend with type information to guess the possible
448 // operand.
Chad Rosier33a71f32012-08-21 17:02:27 +0000449 Asm += getSpelling(SemaRef, AsmToks[i]);
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000450 break;
451 }
452 }
453 break;
454 }
455 }
456 }
457
458 // Emit the final (and possibly only) asm string.
459 AsmStrings[NumAsmStrings] = Asm.c_str();
460}
461
Chad Rosier38c71d32012-08-21 21:56:39 +0000462// Break the AsmSting into pieces.
463static void buildMSAsmPieces(StringRef Asm, std::vector<StringRef> &Pieces) {
464 std::pair<StringRef,StringRef> Split = Asm.split(' ');
465
466 // Mnemonic
467 Pieces.push_back(Split.first);
468 Asm = Split.second;
469
470 // Operands
471 while (!Asm.empty()) {
472 Split = Asm.split(", ");
473 Pieces.push_back(Split.first);
474 Asm = Split.second;
475 }
476}
477
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000478// Build the unmodified MSAsmString.
479static std::string buildMSAsmString(Sema &SemaRef,
480 ArrayRef<Token> AsmToks,
Chad Rosier38c71d32012-08-21 21:56:39 +0000481 std::vector<std::string> &AsmStrings) {
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000482 assert (!AsmToks.empty() && "Didn't expect an empty AsmToks!");
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000483
Chad Rosier38c71d32012-08-21 21:56:39 +0000484 SmallString<512> Res;
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000485 SmallString<512> Asm;
486 for (unsigned i = 0, e = AsmToks.size(); i < e; ++i) {
487 bool isNewAsm = i == 0 || AsmToks[i].isAtStartOfLine() ||
488 AsmToks[i].is(tok::kw_asm);
489
490 if (isNewAsm) {
Chad Rosier38c71d32012-08-21 21:56:39 +0000491 if (i) {
492 AsmStrings.push_back(Asm.c_str());
493 Res += Asm;
494 Asm.clear();
495 Res += '\n';
496 }
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000497 if (AsmToks[i].is(tok::kw_asm)) {
498 i++; // Skip __asm
499 assert (i != e && "Expected another token");
500 }
501 }
502
503 if (i && AsmToks[i].hasLeadingSpace() && !isNewAsm)
504 Asm += ' ';
505
506 Asm += getSpelling(SemaRef, AsmToks[i]);
507 }
Chad Rosier38c71d32012-08-21 21:56:39 +0000508 AsmStrings.push_back(Asm.c_str());
509 Res += Asm;
510 return Res.c_str();
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000511}
512
513StmtResult Sema::ActOnMSAsmStmt(SourceLocation AsmLoc,
514 SourceLocation LBraceLoc,
515 ArrayRef<Token> AsmToks,
516 SourceLocation EndLoc) {
517 // MS-style inline assembly is not fully supported, so emit a warning.
518 Diag(AsmLoc, diag::warn_unsupported_msasm);
519 SmallVector<StringRef,4> Clobbers;
520 std::set<std::string> ClobberRegs;
521 SmallVector<IdentifierInfo*, 4> Inputs;
522 SmallVector<IdentifierInfo*, 4> Outputs;
523
524 // Empty asm statements don't need to instantiate the AsmParser, etc.
525 if (AsmToks.empty()) {
526 StringRef AsmString;
527 MSAsmStmt *NS =
528 new (Context) MSAsmStmt(Context, AsmLoc, LBraceLoc, /*IsSimple*/ true,
529 /*IsVolatile*/ true, AsmToks, Inputs, Outputs,
530 AsmString, Clobbers, EndLoc);
531 return Owned(NS);
532 }
533
534 unsigned NumAsmStrings;
Chad Rosier38c71d32012-08-21 21:56:39 +0000535 std::vector<std::string> AsmStrings;
536 std::string AsmString = buildMSAsmString(*this, AsmToks, AsmStrings);
537 NumAsmStrings = AsmStrings.size();
538
539 std::vector<std::vector<StringRef> > Pieces;
540 Pieces.resize(NumAsmStrings);
541 for (unsigned i = 0; i != NumAsmStrings; ++i)
542 buildMSAsmPieces(AsmStrings[i], Pieces[i]);
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000543
544 bool IsSimple;
545 std::vector<llvm::BitVector> Regs;
546 std::vector<llvm::BitVector> Names;
547 std::vector<std::string> PatchedAsmStrings;
548
549 Regs.resize(NumAsmStrings);
550 Names.resize(NumAsmStrings);
551 PatchedAsmStrings.resize(NumAsmStrings);
552
553 // Rewrite operands to appease the AsmParser.
554 patchMSAsmStrings(*this, IsSimple, AsmLoc, AsmToks,
555 Context.getTargetInfo(), Regs, Names, PatchedAsmStrings);
556
557 // patchMSAsmStrings doesn't correctly patch non-simple asm statements.
558 if (!IsSimple) {
559 MSAsmStmt *NS =
560 new (Context) MSAsmStmt(Context, AsmLoc, LBraceLoc, /*IsSimple*/ true,
561 /*IsVolatile*/ true, AsmToks, Inputs, Outputs,
562 AsmString, Clobbers, EndLoc);
563 return Owned(NS);
564 }
565
566 // Initialize targets and assembly printers/parsers.
567 llvm::InitializeAllTargetInfos();
568 llvm::InitializeAllTargetMCs();
569 llvm::InitializeAllAsmParsers();
570
571 // Get the target specific parser.
572 std::string Error;
573 const std::string &TT = Context.getTargetInfo().getTriple().getTriple();
574 const llvm::Target *TheTarget(llvm::TargetRegistry::lookupTarget(TT, Error));
575
576 OwningPtr<llvm::MCAsmInfo> MAI(TheTarget->createMCAsmInfo(TT));
577 OwningPtr<llvm::MCRegisterInfo> MRI(TheTarget->createMCRegInfo(TT));
578 OwningPtr<llvm::MCObjectFileInfo> MOFI(new llvm::MCObjectFileInfo());
579 OwningPtr<llvm::MCSubtargetInfo>
580 STI(TheTarget->createMCSubtargetInfo(TT, "", ""));
581
582 for (unsigned i = 0, e = PatchedAsmStrings.size(); i != e; ++i) {
583 llvm::SourceMgr SrcMgr;
584 llvm::MCContext Ctx(*MAI, *MRI, MOFI.get(), &SrcMgr);
585 llvm::MemoryBuffer *Buffer =
586 llvm::MemoryBuffer::getMemBuffer(PatchedAsmStrings[i], "<inline asm>");
587
588 // Tell SrcMgr about this buffer, which is what the parser will pick up.
589 SrcMgr.AddNewSourceBuffer(Buffer, llvm::SMLoc());
590
591 OwningPtr<llvm::MCStreamer> Str(createNullStreamer(Ctx));
592 OwningPtr<llvm::MCAsmParser>
593 Parser(createMCAsmParser(SrcMgr, Ctx, *Str.get(), *MAI));
594 OwningPtr<llvm::MCTargetAsmParser>
595 TargetParser(TheTarget->createMCAsmParser(*STI, *Parser));
596 // Change to the Intel dialect.
597 Parser->setAssemblerDialect(1);
598 Parser->setTargetParser(*TargetParser.get());
599
600 // Prime the lexer.
601 Parser->Lex();
602
603 // Parse the opcode.
604 StringRef IDVal;
605 Parser->ParseIdentifier(IDVal);
606
607 // Canonicalize the opcode to lower case.
608 SmallString<128> Opcode;
609 for (unsigned i = 0, e = IDVal.size(); i != e; ++i)
610 Opcode.push_back(tolower(IDVal[i]));
611
612 // Parse the operands.
613 llvm::SMLoc IDLoc;
614 SmallVector<llvm::MCParsedAsmOperand*, 8> Operands;
615 bool HadError = TargetParser->ParseInstruction(Opcode.str(), IDLoc,
616 Operands);
617 assert (!HadError && "Unexpected error parsing instruction");
618
619 // Match the MCInstr.
Chad Rosier83591b62012-08-21 18:15:08 +0000620 unsigned ErrorInfo;
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000621 SmallVector<llvm::MCInst, 2> Instrs;
Chad Rosier83591b62012-08-21 18:15:08 +0000622 HadError = TargetParser->MatchInstruction(IDLoc, Operands, Instrs,
Chad Rosier51a6b3f2012-08-21 19:37:55 +0000623 ErrorInfo,
624 /*matchingInlineAsm*/ true);
Chad Rosier4b5e48d2012-08-17 21:19:40 +0000625 assert (!HadError && "Unexpected error matching instruction");
626 assert ((Instrs.size() == 1) && "Expected only a single instruction.");
627
628 // Get the instruction descriptor.
629 llvm::MCInst Inst = Instrs[0];
630 const llvm::MCInstrInfo *MII = TheTarget->createMCInstrInfo();
631 const llvm::MCInstrDesc &Desc = MII->get(Inst.getOpcode());
632 llvm::MCInstPrinter *IP =
633 TheTarget->createMCInstPrinter(1, *MAI, *MII, *MRI, *STI);
634
635 // Build the list of clobbers.
636 for (unsigned i = 0, e = Desc.getNumDefs(); i != e; ++i) {
637 const llvm::MCOperand &Op = Inst.getOperand(i);
638 if (!Op.isReg())
639 continue;
640
641 std::string Reg;
642 llvm::raw_string_ostream OS(Reg);
643 IP->printRegName(OS, Op.getReg());
644
645 StringRef Clobber(OS.str());
646 if (!Context.getTargetInfo().isValidClobber(Clobber))
647 return StmtError(Diag(AsmLoc, diag::err_asm_unknown_register_name) <<
648 Clobber);
649 ClobberRegs.insert(Reg);
650 }
651 }
652 for (std::set<std::string>::iterator I = ClobberRegs.begin(),
653 E = ClobberRegs.end(); I != E; ++I)
654 Clobbers.push_back(*I);
655
656 MSAsmStmt *NS =
657 new (Context) MSAsmStmt(Context, AsmLoc, LBraceLoc, IsSimple,
658 /*IsVolatile*/ true, AsmToks, Inputs, Outputs,
659 AsmString, Clobbers, EndLoc);
660 return Owned(NS);
661}