LLParser.h revision a73523958d39ca10a322fd8b177104ebc2045130
1//===-- LLParser.h - Parser Class -------------------------------*- C++ -*-===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10//  This file defines the parser class for .ll files.
11//
12//===----------------------------------------------------------------------===//
13
14#ifndef LLVM_ASMPARSER_LLPARSER_H
15#define LLVM_ASMPARSER_LLPARSER_H
16
17#include "LLLexer.h"
18#include "llvm/Module.h"
19#include "llvm/Type.h"
20#include "llvm/Support/ValueHandle.h"
21#include <map>
22
23namespace llvm {
24  class Module;
25  class OpaqueType;
26  class Function;
27  class Value;
28  class BasicBlock;
29  class Instruction;
30  class Constant;
31  class GlobalValue;
32  class MetadataBase;
33  class MDString;
34  class MDNode;
35
36  /// ValID - Represents a reference of a definition of some sort with no type.
37  /// There are several cases where we have to parse the value but where the
38  /// type can depend on later context.  This may either be a numeric reference
39  /// or a symbolic (%var) reference.  This is just a discriminated union.
40  struct ValID {
41    enum {
42      t_LocalID, t_GlobalID,      // ID in UIntVal.
43      t_LocalName, t_GlobalName,  // Name in StrVal.
44      t_APSInt, t_APFloat,        // Value in APSIntVal/APFloatVal.
45      t_Null, t_Undef, t_Zero,    // No value.
46      t_EmptyArray,               // No value:  []
47      t_Constant,                 // Value in ConstantVal.
48      t_InlineAsm,                // Value in StrVal/StrVal2/UIntVal.
49      t_MDNode,                   // Value in MDNodeVal.
50      t_MDString                  // Value in MDStringVal.
51    } Kind;
52
53    LLLexer::LocTy Loc;
54    unsigned UIntVal;
55    std::string StrVal, StrVal2;
56    APSInt APSIntVal;
57    APFloat APFloatVal;
58    Constant *ConstantVal;
59    MDNode *MDNodeVal;
60    MDString *MDStringVal;
61    ValID() : APFloatVal(0.0) {}
62
63    bool operator<(const ValID &RHS) const {
64      if (Kind == t_LocalID || Kind == t_GlobalID)
65        return UIntVal < RHS.UIntVal;
66      assert((Kind == t_LocalName || Kind == t_GlobalName) &&
67             "Ordering not defined for this ValID kind yet");
68      return StrVal < RHS.StrVal;
69    }
70  };
71
72  class LLParser {
73  public:
74    typedef LLLexer::LocTy LocTy;
75  private:
76    LLVMContext& Context;
77    LLLexer Lex;
78    Module *M;
79
80    // Type resolution handling data structures.
81    std::map<std::string, std::pair<PATypeHolder, LocTy> > ForwardRefTypes;
82    std::map<unsigned, std::pair<PATypeHolder, LocTy> > ForwardRefTypeIDs;
83    std::vector<PATypeHolder> NumberedTypes;
84    /// MetadataCache - This map keeps track of parsed metadata constants.
85    std::map<unsigned, TrackingVH<MDNode> > MetadataCache;
86    std::map<unsigned, std::pair<TrackingVH<MDNode>, LocTy> > ForwardRefMDNodes;
87    SmallVector<std::pair<unsigned, MDNode *>, 2> MDsOnInst;
88    struct UpRefRecord {
89      /// Loc - This is the location of the upref.
90      LocTy Loc;
91
92      /// NestingLevel - The number of nesting levels that need to be popped
93      /// before this type is resolved.
94      unsigned NestingLevel;
95
96      /// LastContainedTy - This is the type at the current binding level for
97      /// the type.  Every time we reduce the nesting level, this gets updated.
98      const Type *LastContainedTy;
99
100      /// UpRefTy - This is the actual opaque type that the upreference is
101      /// represented with.
102      OpaqueType *UpRefTy;
103
104      UpRefRecord(LocTy L, unsigned NL, OpaqueType *URTy)
105        : Loc(L), NestingLevel(NL), LastContainedTy((Type*)URTy),
106          UpRefTy(URTy) {}
107    };
108    std::vector<UpRefRecord> UpRefs;
109
110    // Global Value reference information.
111    std::map<std::string, std::pair<GlobalValue*, LocTy> > ForwardRefVals;
112    std::map<unsigned, std::pair<GlobalValue*, LocTy> > ForwardRefValIDs;
113    std::vector<GlobalValue*> NumberedVals;
114
115    // References to blockaddress.  The key is the function ValID, the value is
116    // a list of references to blocks in that function.
117    std::map<ValID, std::vector<std::pair<ValID, GlobalValue*> > >
118      ForwardRefBlockAddresses;
119
120    Function *MallocF;
121  public:
122    LLParser(MemoryBuffer *F, SourceMgr &SM, SMDiagnostic &Err, Module *m) :
123      Context(m->getContext()), Lex(F, SM, Err, m->getContext()),
124      M(m), MallocF(NULL) {}
125    bool Run();
126
127    LLVMContext& getContext() { return Context; }
128
129  private:
130
131    bool Error(LocTy L, const std::string &Msg) const {
132      return Lex.Error(L, Msg);
133    }
134    bool TokError(const std::string &Msg) const {
135      return Error(Lex.getLoc(), Msg);
136    }
137
138    /// GetGlobalVal - Get a value with the specified name or ID, creating a
139    /// forward reference record if needed.  This can return null if the value
140    /// exists but does not have the right type.
141    GlobalValue *GetGlobalVal(const std::string &N, const Type *Ty, LocTy Loc);
142    GlobalValue *GetGlobalVal(unsigned ID, const Type *Ty, LocTy Loc);
143
144    // Helper Routines.
145    bool ParseToken(lltok::Kind T, const char *ErrMsg);
146    bool EatIfPresent(lltok::Kind T) {
147      if (Lex.getKind() != T) return false;
148      Lex.Lex();
149      return true;
150    }
151    bool ParseOptionalToken(lltok::Kind T, bool &Present) {
152      if (Lex.getKind() != T) {
153        Present = false;
154      } else {
155        Lex.Lex();
156        Present = true;
157      }
158      return false;
159    }
160    bool ParseStringConstant(std::string &Result);
161    bool ParseUInt32(unsigned &Val);
162    bool ParseUInt32(unsigned &Val, LocTy &Loc) {
163      Loc = Lex.getLoc();
164      return ParseUInt32(Val);
165    }
166    bool ParseOptionalAddrSpace(unsigned &AddrSpace);
167    bool ParseOptionalAttrs(unsigned &Attrs, unsigned AttrKind);
168    bool ParseOptionalLinkage(unsigned &Linkage, bool &HasLinkage);
169    bool ParseOptionalLinkage(unsigned &Linkage) {
170      bool HasLinkage; return ParseOptionalLinkage(Linkage, HasLinkage);
171    }
172    bool ParseOptionalVisibility(unsigned &Visibility);
173    bool ParseOptionalCallingConv(CallingConv::ID &CC);
174    bool ParseOptionalAlignment(unsigned &Alignment);
175    bool ParseOptionalCustomMetadata();
176    bool ParseOptionalInfo(unsigned &Alignment);
177    bool ParseIndexList(SmallVectorImpl<unsigned> &Indices);
178
179    // Top-Level Entities
180    bool ParseTopLevelEntities();
181    bool ValidateEndOfModule();
182    bool ParseTargetDefinition();
183    bool ParseDepLibs();
184    bool ParseModuleAsm();
185    bool ParseUnnamedType();
186    bool ParseNamedType();
187    bool ParseDeclare();
188    bool ParseDefine();
189
190    bool ParseGlobalType(bool &IsConstant);
191    bool ParseUnnamedGlobal();
192    bool ParseNamedGlobal();
193    bool ParseGlobal(const std::string &Name, LocTy Loc, unsigned Linkage,
194                     bool HasLinkage, unsigned Visibility);
195    bool ParseAlias(const std::string &Name, LocTy Loc, unsigned Visibility);
196    bool ParseStandaloneMetadata();
197    bool ParseNamedMetadata();
198    bool ParseMDString(MDString *&Result);
199    bool ParseMDNodeID(MDNode *&Result);
200
201    // Type Parsing.
202    bool ParseType(PATypeHolder &Result, bool AllowVoid = false);
203    bool ParseType(PATypeHolder &Result, LocTy &Loc, bool AllowVoid = false) {
204      Loc = Lex.getLoc();
205      return ParseType(Result, AllowVoid);
206    }
207    bool ParseTypeRec(PATypeHolder &H);
208    bool ParseStructType(PATypeHolder &H, bool Packed);
209    bool ParseArrayVectorType(PATypeHolder &H, bool isVector);
210    bool ParseFunctionType(PATypeHolder &Result);
211    PATypeHolder HandleUpRefs(const Type *Ty);
212
213    // Constants.
214    bool ParseValID(ValID &ID);
215    bool ConvertGlobalValIDToValue(const Type *Ty, ValID &ID, Constant *&V);
216    bool ConvertGlobalOrMetadataValIDToValue(const Type *Ty, ValID &ID,
217                                             Value *&V);
218    bool ParseGlobalValue(const Type *Ty, Constant *&V);
219    bool ParseGlobalTypeAndValue(Constant *&V);
220    bool ParseGlobalValueVector(SmallVectorImpl<Constant*> &Elts);
221    bool ParseMDNodeVector(SmallVectorImpl<Value*> &);
222
223
224    // Function Semantic Analysis.
225    class PerFunctionState {
226      LLParser &P;
227      Function &F;
228      std::map<std::string, std::pair<Value*, LocTy> > ForwardRefVals;
229      std::map<unsigned, std::pair<Value*, LocTy> > ForwardRefValIDs;
230      std::vector<Value*> NumberedVals;
231
232      /// FunctionNumber - If this is an unnamed function, this is the slot
233      /// number of it, otherwise it is -1.
234      int FunctionNumber;
235    public:
236      PerFunctionState(LLParser &p, Function &f, int FunctionNumber);
237      ~PerFunctionState();
238
239      Function &getFunction() const { return F; }
240
241      bool FinishFunction();
242
243      /// GetVal - Get a value with the specified name or ID, creating a
244      /// forward reference record if needed.  This can return null if the value
245      /// exists but does not have the right type.
246      Value *GetVal(const std::string &Name, const Type *Ty, LocTy Loc);
247      Value *GetVal(unsigned ID, const Type *Ty, LocTy Loc);
248
249      /// SetInstName - After an instruction is parsed and inserted into its
250      /// basic block, this installs its name.
251      bool SetInstName(int NameID, const std::string &NameStr, LocTy NameLoc,
252                       Instruction *Inst);
253
254      /// GetBB - Get a basic block with the specified name or ID, creating a
255      /// forward reference record if needed.  This can return null if the value
256      /// is not a BasicBlock.
257      BasicBlock *GetBB(const std::string &Name, LocTy Loc);
258      BasicBlock *GetBB(unsigned ID, LocTy Loc);
259
260      /// DefineBB - Define the specified basic block, which is either named or
261      /// unnamed.  If there is an error, this returns null otherwise it returns
262      /// the block being defined.
263      BasicBlock *DefineBB(const std::string &Name, LocTy Loc);
264    };
265
266    bool ConvertValIDToValue(const Type *Ty, ValID &ID, Value *&V,
267                             PerFunctionState &PFS);
268
269    bool ParseValue(const Type *Ty, Value *&V, PerFunctionState &PFS);
270    bool ParseValue(const Type *Ty, Value *&V, LocTy &Loc,
271                    PerFunctionState &PFS) {
272      Loc = Lex.getLoc();
273      return ParseValue(Ty, V, PFS);
274    }
275
276    bool ParseTypeAndValue(Value *&V, PerFunctionState &PFS);
277    bool ParseTypeAndValue(Value *&V, LocTy &Loc, PerFunctionState &PFS) {
278      Loc = Lex.getLoc();
279      return ParseTypeAndValue(V, PFS);
280    }
281    bool ParseTypeAndBasicBlock(BasicBlock *&BB, LocTy &Loc,
282                                PerFunctionState &PFS);
283    bool ParseTypeAndBasicBlock(BasicBlock *&BB, PerFunctionState &PFS) {
284      LocTy Loc;
285      return ParseTypeAndBasicBlock(BB, Loc, PFS);
286    }
287
288    struct ParamInfo {
289      LocTy Loc;
290      Value *V;
291      unsigned Attrs;
292      ParamInfo(LocTy loc, Value *v, unsigned attrs)
293        : Loc(loc), V(v), Attrs(attrs) {}
294    };
295    bool ParseParameterList(SmallVectorImpl<ParamInfo> &ArgList,
296                            PerFunctionState &PFS);
297
298    // Function Parsing.
299    struct ArgInfo {
300      LocTy Loc;
301      PATypeHolder Type;
302      unsigned Attrs;
303      std::string Name;
304      ArgInfo(LocTy L, PATypeHolder Ty, unsigned Attr, const std::string &N)
305        : Loc(L), Type(Ty), Attrs(Attr), Name(N) {}
306    };
307    bool ParseArgumentList(std::vector<ArgInfo> &ArgList,
308                           bool &isVarArg, bool inType);
309    bool ParseFunctionHeader(Function *&Fn, bool isDefine);
310    bool ParseFunctionBody(Function &Fn);
311    bool ParseBasicBlock(PerFunctionState &PFS);
312
313    // Instruction Parsing.
314    bool ParseInstruction(Instruction *&Inst, BasicBlock *BB,
315                          PerFunctionState &PFS);
316    bool ParseCmpPredicate(unsigned &Pred, unsigned Opc);
317
318    bool ParseRet(Instruction *&Inst, BasicBlock *BB, PerFunctionState &PFS);
319    bool ParseBr(Instruction *&Inst, PerFunctionState &PFS);
320    bool ParseSwitch(Instruction *&Inst, PerFunctionState &PFS);
321    bool ParseIndirectBr(Instruction *&Inst, PerFunctionState &PFS);
322    bool ParseInvoke(Instruction *&Inst, PerFunctionState &PFS);
323
324    bool ParseArithmetic(Instruction *&I, PerFunctionState &PFS, unsigned Opc,
325                         unsigned OperandType);
326    bool ParseLogical(Instruction *&I, PerFunctionState &PFS, unsigned Opc);
327    bool ParseCompare(Instruction *&I, PerFunctionState &PFS, unsigned Opc);
328    bool ParseCast(Instruction *&I, PerFunctionState &PFS, unsigned Opc);
329    bool ParseSelect(Instruction *&I, PerFunctionState &PFS);
330    bool ParseVA_Arg(Instruction *&I, PerFunctionState &PFS);
331    bool ParseExtractElement(Instruction *&I, PerFunctionState &PFS);
332    bool ParseInsertElement(Instruction *&I, PerFunctionState &PFS);
333    bool ParseShuffleVector(Instruction *&I, PerFunctionState &PFS);
334    bool ParsePHI(Instruction *&I, PerFunctionState &PFS);
335    bool ParseCall(Instruction *&I, PerFunctionState &PFS, bool isTail);
336    bool ParseAlloc(Instruction *&I, PerFunctionState &PFS,
337                    BasicBlock *BB = 0, bool isAlloca = true);
338    bool ParseFree(Instruction *&I, PerFunctionState &PFS, BasicBlock *BB);
339    bool ParseLoad(Instruction *&I, PerFunctionState &PFS, bool isVolatile);
340    bool ParseStore(Instruction *&I, PerFunctionState &PFS, bool isVolatile);
341    bool ParseGetResult(Instruction *&I, PerFunctionState &PFS);
342    bool ParseGetElementPtr(Instruction *&I, PerFunctionState &PFS);
343    bool ParseExtractValue(Instruction *&I, PerFunctionState &PFS);
344    bool ParseInsertValue(Instruction *&I, PerFunctionState &PFS);
345
346    bool ResolveForwardRefBlockAddresses(Function *TheFn,
347                             std::vector<std::pair<ValID, GlobalValue*> > &Refs,
348                                         PerFunctionState *PFS);
349  };
350} // End llvm namespace
351
352#endif
353