| //===-- LLParser.h - Parser Class -------------------------------*- C++ -*-===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file defines the parser class for .ll files. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #ifndef LLVM_ASMPARSER_LLPARSER_H |
| #define LLVM_ASMPARSER_LLPARSER_H |
| |
| #include "LLLexer.h" |
| #include "llvm/Module.h" |
| #include "llvm/Type.h" |
| #include "llvm/ADT/DenseMap.h" |
| #include "llvm/Support/ValueHandle.h" |
| #include <map> |
| |
| namespace llvm { |
| class Module; |
| class OpaqueType; |
| class Function; |
| class Value; |
| class BasicBlock; |
| class Instruction; |
| class Constant; |
| class GlobalValue; |
| class MDString; |
| class MDNode; |
| |
| /// ValID - Represents a reference of a definition of some sort with no type. |
| /// There are several cases where we have to parse the value but where the |
| /// type can depend on later context. This may either be a numeric reference |
| /// or a symbolic (%var) reference. This is just a discriminated union. |
| struct ValID { |
| enum { |
| t_LocalID, t_GlobalID, // ID in UIntVal. |
| t_LocalName, t_GlobalName, // Name in StrVal. |
| t_APSInt, t_APFloat, // Value in APSIntVal/APFloatVal. |
| t_Null, t_Undef, t_Zero, // No value. |
| t_EmptyArray, // No value: [] |
| t_Constant, // Value in ConstantVal. |
| t_InlineAsm, // Value in StrVal/StrVal2/UIntVal. |
| t_MDNode, // Value in MDNodeVal. |
| t_MDString // Value in MDStringVal. |
| } Kind; |
| |
| LLLexer::LocTy Loc; |
| unsigned UIntVal; |
| std::string StrVal, StrVal2; |
| APSInt APSIntVal; |
| APFloat APFloatVal; |
| Constant *ConstantVal; |
| MDNode *MDNodeVal; |
| MDString *MDStringVal; |
| ValID() : APFloatVal(0.0) {} |
| |
| bool operator<(const ValID &RHS) const { |
| if (Kind == t_LocalID || Kind == t_GlobalID) |
| return UIntVal < RHS.UIntVal; |
| assert((Kind == t_LocalName || Kind == t_GlobalName) && |
| "Ordering not defined for this ValID kind yet"); |
| return StrVal < RHS.StrVal; |
| } |
| }; |
| |
| class LLParser { |
| public: |
| typedef LLLexer::LocTy LocTy; |
| private: |
| LLVMContext &Context; |
| LLLexer Lex; |
| Module *M; |
| |
| // Instruction metadata resolution. Each instruction can have a list of |
| // MDRef info associated with them. |
| // |
| // The simpler approach of just creating temporary MDNodes and then calling |
| // RAUW on them when the definition is processed doesn't work because some |
| // instruction metadata kinds, such as dbg, get stored in the IR in an |
| // "optimized" format which doesn't participate in the normal value use |
| // lists. This means that RAUW doesn't work, even on temporary MDNodes |
| // which otherwise support RAUW. Instead, we defer resolving MDNode |
| // references until the definitions have been processed. |
| struct MDRef { |
| SMLoc Loc; |
| unsigned MDKind, MDSlot; |
| }; |
| DenseMap<Instruction*, std::vector<MDRef> > ForwardRefInstMetadata; |
| |
| // Type resolution handling data structures. |
| std::map<std::string, std::pair<PATypeHolder, LocTy> > ForwardRefTypes; |
| std::map<unsigned, std::pair<PATypeHolder, LocTy> > ForwardRefTypeIDs; |
| std::vector<PATypeHolder> NumberedTypes; |
| std::vector<TrackingVH<MDNode> > NumberedMetadata; |
| std::map<unsigned, std::pair<TrackingVH<MDNode>, LocTy> > ForwardRefMDNodes; |
| struct UpRefRecord { |
| /// Loc - This is the location of the upref. |
| LocTy Loc; |
| |
| /// NestingLevel - The number of nesting levels that need to be popped |
| /// before this type is resolved. |
| unsigned NestingLevel; |
| |
| /// LastContainedTy - This is the type at the current binding level for |
| /// the type. Every time we reduce the nesting level, this gets updated. |
| const Type *LastContainedTy; |
| |
| /// UpRefTy - This is the actual opaque type that the upreference is |
| /// represented with. |
| OpaqueType *UpRefTy; |
| |
| UpRefRecord(LocTy L, unsigned NL, OpaqueType *URTy) |
| : Loc(L), NestingLevel(NL), LastContainedTy((Type*)URTy), |
| UpRefTy(URTy) {} |
| }; |
| std::vector<UpRefRecord> UpRefs; |
| |
| // Global Value reference information. |
| std::map<std::string, std::pair<GlobalValue*, LocTy> > ForwardRefVals; |
| std::map<unsigned, std::pair<GlobalValue*, LocTy> > ForwardRefValIDs; |
| std::vector<GlobalValue*> NumberedVals; |
| |
| // References to blockaddress. The key is the function ValID, the value is |
| // a list of references to blocks in that function. |
| std::map<ValID, std::vector<std::pair<ValID, GlobalValue*> > > |
| ForwardRefBlockAddresses; |
| |
| Function *MallocF; |
| public: |
| LLParser(MemoryBuffer *F, SourceMgr &SM, SMDiagnostic &Err, Module *m) : |
| Context(m->getContext()), Lex(F, SM, Err, m->getContext()), |
| M(m), MallocF(NULL) {} |
| bool Run(); |
| |
| LLVMContext& getContext() { return Context; } |
| |
| private: |
| |
| bool Error(LocTy L, const std::string &Msg) const { |
| return Lex.Error(L, Msg); |
| } |
| bool TokError(const std::string &Msg) const { |
| return Error(Lex.getLoc(), Msg); |
| } |
| |
| /// GetGlobalVal - Get a value with the specified name or ID, creating a |
| /// forward reference record if needed. This can return null if the value |
| /// exists but does not have the right type. |
| GlobalValue *GetGlobalVal(const std::string &N, const Type *Ty, LocTy Loc); |
| GlobalValue *GetGlobalVal(unsigned ID, const Type *Ty, LocTy Loc); |
| |
| // Helper Routines. |
| bool ParseToken(lltok::Kind T, const char *ErrMsg); |
| bool EatIfPresent(lltok::Kind T) { |
| if (Lex.getKind() != T) return false; |
| Lex.Lex(); |
| return true; |
| } |
| bool ParseOptionalToken(lltok::Kind T, bool &Present) { |
| if (Lex.getKind() != T) { |
| Present = false; |
| } else { |
| Lex.Lex(); |
| Present = true; |
| } |
| return false; |
| } |
| bool ParseStringConstant(std::string &Result); |
| bool ParseUInt32(unsigned &Val); |
| bool ParseUInt32(unsigned &Val, LocTy &Loc) { |
| Loc = Lex.getLoc(); |
| return ParseUInt32(Val); |
| } |
| bool ParseOptionalAddrSpace(unsigned &AddrSpace); |
| bool ParseOptionalAttrs(unsigned &Attrs, unsigned AttrKind); |
| bool ParseOptionalLinkage(unsigned &Linkage, bool &HasLinkage); |
| bool ParseOptionalLinkage(unsigned &Linkage) { |
| bool HasLinkage; return ParseOptionalLinkage(Linkage, HasLinkage); |
| } |
| bool ParseOptionalVisibility(unsigned &Visibility); |
| bool ParseOptionalCallingConv(CallingConv::ID &CC); |
| bool ParseOptionalAlignment(unsigned &Alignment); |
| bool ParseOptionalStackAlignment(unsigned &Alignment); |
| bool ParseOptionalCommaAlign(unsigned &Alignment, bool &AteExtraComma); |
| bool ParseIndexList(SmallVectorImpl<unsigned> &Indices,bool &AteExtraComma); |
| bool ParseIndexList(SmallVectorImpl<unsigned> &Indices) { |
| bool AteExtraComma; |
| if (ParseIndexList(Indices, AteExtraComma)) return true; |
| if (AteExtraComma) |
| return TokError("expected index"); |
| return false; |
| } |
| |
| // Top-Level Entities |
| bool ParseTopLevelEntities(); |
| bool ValidateEndOfModule(); |
| bool ParseTargetDefinition(); |
| bool ParseDepLibs(); |
| bool ParseModuleAsm(); |
| bool ParseUnnamedType(); |
| bool ParseNamedType(); |
| bool ParseDeclare(); |
| bool ParseDefine(); |
| |
| bool ParseGlobalType(bool &IsConstant); |
| bool ParseUnnamedGlobal(); |
| bool ParseNamedGlobal(); |
| bool ParseGlobal(const std::string &Name, LocTy Loc, unsigned Linkage, |
| bool HasLinkage, unsigned Visibility); |
| bool ParseAlias(const std::string &Name, LocTy Loc, unsigned Visibility); |
| bool ParseStandaloneMetadata(); |
| bool ParseNamedMetadata(); |
| bool ParseMDString(MDString *&Result); |
| bool ParseMDNodeID(MDNode *&Result); |
| bool ParseMDNodeID(MDNode *&Result, unsigned &SlotNo); |
| |
| // Type Parsing. |
| bool ParseType(PATypeHolder &Result, bool AllowVoid = false); |
| bool ParseType(PATypeHolder &Result, LocTy &Loc, bool AllowVoid = false) { |
| Loc = Lex.getLoc(); |
| return ParseType(Result, AllowVoid); |
| } |
| bool ParseTypeRec(PATypeHolder &H); |
| bool ParseStructType(PATypeHolder &H, bool Packed); |
| bool ParseArrayVectorType(PATypeHolder &H, bool isVector); |
| bool ParseFunctionType(PATypeHolder &Result); |
| PATypeHolder HandleUpRefs(const Type *Ty); |
| |
| // Function Semantic Analysis. |
| class PerFunctionState { |
| LLParser &P; |
| Function &F; |
| std::map<std::string, std::pair<Value*, LocTy> > ForwardRefVals; |
| std::map<unsigned, std::pair<Value*, LocTy> > ForwardRefValIDs; |
| std::vector<Value*> NumberedVals; |
| |
| /// FunctionNumber - If this is an unnamed function, this is the slot |
| /// number of it, otherwise it is -1. |
| int FunctionNumber; |
| public: |
| PerFunctionState(LLParser &p, Function &f, int FunctionNumber); |
| ~PerFunctionState(); |
| |
| Function &getFunction() const { return F; } |
| |
| bool FinishFunction(); |
| |
| /// GetVal - Get a value with the specified name or ID, creating a |
| /// forward reference record if needed. This can return null if the value |
| /// exists but does not have the right type. |
| Value *GetVal(const std::string &Name, const Type *Ty, LocTy Loc); |
| Value *GetVal(unsigned ID, const Type *Ty, LocTy Loc); |
| |
| /// SetInstName - After an instruction is parsed and inserted into its |
| /// basic block, this installs its name. |
| bool SetInstName(int NameID, const std::string &NameStr, LocTy NameLoc, |
| Instruction *Inst); |
| |
| /// GetBB - Get a basic block with the specified name or ID, creating a |
| /// forward reference record if needed. This can return null if the value |
| /// is not a BasicBlock. |
| BasicBlock *GetBB(const std::string &Name, LocTy Loc); |
| BasicBlock *GetBB(unsigned ID, LocTy Loc); |
| |
| /// DefineBB - Define the specified basic block, which is either named or |
| /// unnamed. If there is an error, this returns null otherwise it returns |
| /// the block being defined. |
| BasicBlock *DefineBB(const std::string &Name, LocTy Loc); |
| }; |
| |
| bool ConvertValIDToValue(const Type *Ty, ValID &ID, Value *&V, |
| PerFunctionState *PFS); |
| |
| bool ParseValue(const Type *Ty, Value *&V, PerFunctionState &PFS); |
| bool ParseValue(const Type *Ty, Value *&V, LocTy &Loc, |
| PerFunctionState &PFS) { |
| Loc = Lex.getLoc(); |
| return ParseValue(Ty, V, PFS); |
| } |
| |
| bool ParseTypeAndValue(Value *&V, PerFunctionState &PFS); |
| bool ParseTypeAndValue(Value *&V, LocTy &Loc, PerFunctionState &PFS) { |
| Loc = Lex.getLoc(); |
| return ParseTypeAndValue(V, PFS); |
| } |
| bool ParseTypeAndBasicBlock(BasicBlock *&BB, LocTy &Loc, |
| PerFunctionState &PFS); |
| bool ParseTypeAndBasicBlock(BasicBlock *&BB, PerFunctionState &PFS) { |
| LocTy Loc; |
| return ParseTypeAndBasicBlock(BB, Loc, PFS); |
| } |
| |
| |
| struct ParamInfo { |
| LocTy Loc; |
| Value *V; |
| unsigned Attrs; |
| ParamInfo(LocTy loc, Value *v, unsigned attrs) |
| : Loc(loc), V(v), Attrs(attrs) {} |
| }; |
| bool ParseParameterList(SmallVectorImpl<ParamInfo> &ArgList, |
| PerFunctionState &PFS); |
| |
| // Constant Parsing. |
| bool ParseValID(ValID &ID, PerFunctionState *PFS = NULL); |
| bool ParseGlobalValue(const Type *Ty, Constant *&V); |
| bool ParseGlobalTypeAndValue(Constant *&V); |
| bool ParseGlobalValueVector(SmallVectorImpl<Constant*> &Elts); |
| bool ParseMetadataListValue(ValID &ID, PerFunctionState *PFS); |
| bool ParseMetadataValue(ValID &ID, PerFunctionState *PFS); |
| bool ParseMDNodeVector(SmallVectorImpl<Value*> &, PerFunctionState *PFS); |
| bool ParseInstructionMetadata(Instruction *Inst, PerFunctionState *PFS); |
| |
| // Function Parsing. |
| struct ArgInfo { |
| LocTy Loc; |
| PATypeHolder Type; |
| unsigned Attrs; |
| std::string Name; |
| ArgInfo(LocTy L, PATypeHolder Ty, unsigned Attr, const std::string &N) |
| : Loc(L), Type(Ty), Attrs(Attr), Name(N) {} |
| }; |
| bool ParseArgumentList(std::vector<ArgInfo> &ArgList, |
| bool &isVarArg, bool inType); |
| bool ParseFunctionHeader(Function *&Fn, bool isDefine); |
| bool ParseFunctionBody(Function &Fn); |
| bool ParseBasicBlock(PerFunctionState &PFS); |
| |
| // Instruction Parsing. Each instruction parsing routine can return with a |
| // normal result, an error result, or return having eaten an extra comma. |
| enum InstResult { InstNormal = 0, InstError = 1, InstExtraComma = 2 }; |
| int ParseInstruction(Instruction *&Inst, BasicBlock *BB, |
| PerFunctionState &PFS); |
| bool ParseCmpPredicate(unsigned &Pred, unsigned Opc); |
| |
| int ParseRet(Instruction *&Inst, BasicBlock *BB, PerFunctionState &PFS); |
| bool ParseBr(Instruction *&Inst, PerFunctionState &PFS); |
| bool ParseSwitch(Instruction *&Inst, PerFunctionState &PFS); |
| bool ParseIndirectBr(Instruction *&Inst, PerFunctionState &PFS); |
| bool ParseInvoke(Instruction *&Inst, PerFunctionState &PFS); |
| |
| bool ParseArithmetic(Instruction *&I, PerFunctionState &PFS, unsigned Opc, |
| unsigned OperandType); |
| bool ParseLogical(Instruction *&I, PerFunctionState &PFS, unsigned Opc); |
| bool ParseCompare(Instruction *&I, PerFunctionState &PFS, unsigned Opc); |
| bool ParseCast(Instruction *&I, PerFunctionState &PFS, unsigned Opc); |
| bool ParseSelect(Instruction *&I, PerFunctionState &PFS); |
| bool ParseVA_Arg(Instruction *&I, PerFunctionState &PFS); |
| bool ParseExtractElement(Instruction *&I, PerFunctionState &PFS); |
| bool ParseInsertElement(Instruction *&I, PerFunctionState &PFS); |
| bool ParseShuffleVector(Instruction *&I, PerFunctionState &PFS); |
| int ParsePHI(Instruction *&I, PerFunctionState &PFS); |
| bool ParseCall(Instruction *&I, PerFunctionState &PFS, bool isTail); |
| int ParseAlloc(Instruction *&I, PerFunctionState &PFS, |
| BasicBlock *BB = 0, bool isAlloca = true); |
| bool ParseFree(Instruction *&I, PerFunctionState &PFS, BasicBlock *BB); |
| int ParseLoad(Instruction *&I, PerFunctionState &PFS, bool isVolatile); |
| int ParseStore(Instruction *&I, PerFunctionState &PFS, bool isVolatile); |
| bool ParseGetResult(Instruction *&I, PerFunctionState &PFS); |
| int ParseGetElementPtr(Instruction *&I, PerFunctionState &PFS); |
| int ParseExtractValue(Instruction *&I, PerFunctionState &PFS); |
| int ParseInsertValue(Instruction *&I, PerFunctionState &PFS); |
| |
| bool ResolveForwardRefBlockAddresses(Function *TheFn, |
| std::vector<std::pair<ValID, GlobalValue*> > &Refs, |
| PerFunctionState *PFS); |
| }; |
| } // End llvm namespace |
| |
| #endif |