1 //===-- llvmAsmParser.y - Parser for llvm assembly files ---------*- C++ -*--=//
3 // This file implements the bison parser for LLVM assembly languages files.
5 //===------------------------------------------------------------------------=//
8 #include "ParserInternals.h"
9 #include "llvm/SymbolTable.h"
10 #include "llvm/Module.h"
11 #include "llvm/iTerminators.h"
12 #include "llvm/iMemory.h"
13 #include "llvm/iOperators.h"
14 #include "llvm/iPHINode.h"
15 #include "Support/STLExtras.h"
16 #include "Support/DepthFirstIterator.h"
21 int yyerror(const char *ErrorMsg); // Forward declarations to prevent "implicit
22 int yylex(); // declaration" of xxx warnings.
25 static Module *ParserResult;
26 std::string CurFilename;
28 // DEBUG_UPREFS - Define this symbol if you want to enable debugging output
29 // relating to upreferences in the input stream.
31 //#define DEBUG_UPREFS 1
33 #define UR_OUT(X) std::cerr << X
38 #define YYERROR_VERBOSE 1
40 // This contains info used when building the body of a function. It is
41 // destroyed when the function is completed.
43 typedef std::vector<Value *> ValueList; // Numbered defs
44 static void ResolveDefinitions(std::vector<ValueList> &LateResolvers,
45 std::vector<ValueList> *FutureLateResolvers = 0);
47 static struct PerModuleInfo {
48 Module *CurrentModule;
49 std::vector<ValueList> Values; // Module level numbered definitions
50 std::vector<ValueList> LateResolveValues;
51 std::vector<PATypeHolder> Types;
52 std::map<ValID, PATypeHolder> LateResolveTypes;
54 // GlobalRefs - This maintains a mapping between <Type, ValID>'s and forward
55 // references to global values. Global values may be referenced before they
56 // are defined, and if so, the temporary object that they represent is held
57 // here. This is used for forward references of ConstantPointerRefs.
59 typedef std::map<std::pair<const PointerType *,
60 ValID>, GlobalVariable*> GlobalRefsType;
61 GlobalRefsType GlobalRefs;
64 // If we could not resolve some functions at function compilation time
65 // (calls to functions before they are defined), resolve them now... Types
66 // are resolved when the constant pool has been completely parsed.
68 ResolveDefinitions(LateResolveValues);
70 // Check to make sure that all global value forward references have been
73 if (!GlobalRefs.empty()) {
74 std::string UndefinedReferences = "Unresolved global references exist:\n";
76 for (GlobalRefsType::iterator I = GlobalRefs.begin(), E =GlobalRefs.end();
78 UndefinedReferences += " " + I->first.first->getDescription() + " " +
79 I->first.second.getName() + "\n";
81 ThrowException(UndefinedReferences);
84 Values.clear(); // Clear out function local definitions
90 // DeclareNewGlobalValue - Called every time a new GV has been defined. This
91 // is used to remove things from the forward declaration map, resolving them
92 // to the correct thing as needed.
94 void DeclareNewGlobalValue(GlobalValue *GV, ValID D) {
95 // Check to see if there is a forward reference to this global variable...
96 // if there is, eliminate it and patch the reference to use the new def'n.
97 GlobalRefsType::iterator I =
98 GlobalRefs.find(std::make_pair(GV->getType(), D));
100 if (I != GlobalRefs.end()) {
101 GlobalVariable *OldGV = I->second; // Get the placeholder...
102 I->first.second.destroy(); // Free string memory if necessary
104 // Loop over all of the uses of the GlobalValue. The only thing they are
105 // allowed to be is ConstantPointerRef's.
106 assert(OldGV->use_size() == 1 && "Only one reference should exist!");
107 User *U = OldGV->use_back(); // Must be a ConstantPointerRef...
108 ConstantPointerRef *CPR = cast<ConstantPointerRef>(U);
110 // Change the const pool reference to point to the real global variable
111 // now. This should drop a use from the OldGV.
112 CPR->mutateReferences(OldGV, GV);
113 assert(OldGV->use_empty() && "All uses should be gone now!");
115 // Remove OldGV from the module...
116 CurrentModule->getGlobalList().remove(OldGV);
117 delete OldGV; // Delete the old placeholder
119 // Remove the map entry for the global now that it has been created...
126 static struct PerFunctionInfo {
127 Function *CurrentFunction; // Pointer to current function being created
129 std::vector<ValueList> Values; // Keep track of numbered definitions
130 std::vector<ValueList> LateResolveValues;
131 std::vector<PATypeHolder> Types;
132 std::map<ValID, PATypeHolder> LateResolveTypes;
133 bool isDeclare; // Is this function a forward declararation?
135 inline PerFunctionInfo() {
140 inline ~PerFunctionInfo() {}
142 inline void FunctionStart(Function *M) {
146 void FunctionDone() {
147 // If we could not resolve some blocks at parsing time (forward branches)
148 // resolve the branches now...
149 ResolveDefinitions(LateResolveValues, &CurModule.LateResolveValues);
151 // Make sure to resolve any constant expr references that might exist within
152 // the function we just declared itself.
154 if (CurrentFunction->hasName()) {
155 FID = ValID::create((char*)CurrentFunction->getName().c_str());
157 unsigned Slot = CurrentFunction->getType()->getUniqueID();
158 assert(CurModule.Values.size() > Slot && "Function not inserted?");
159 // Figure out which slot number if is...
160 for (unsigned i = 0; ; ++i) {
161 assert(i < CurModule.Values[Slot].size() && "Function not found!");
162 if (CurModule.Values[Slot][i] == CurrentFunction) {
163 FID = ValID::create((int)i);
168 CurModule.DeclareNewGlobalValue(CurrentFunction, FID);
170 Values.clear(); // Clear out function local definitions
175 } CurMeth; // Info for the current function...
177 static bool inFunctionScope() { return CurMeth.CurrentFunction != 0; }
180 //===----------------------------------------------------------------------===//
181 // Code to handle definitions of all the types
182 //===----------------------------------------------------------------------===//
184 static int InsertValue(Value *D,
185 std::vector<ValueList> &ValueTab = CurMeth.Values) {
186 if (D->hasName()) return -1; // Is this a numbered definition?
188 // Yes, insert the value into the value table...
189 unsigned type = D->getType()->getUniqueID();
190 if (ValueTab.size() <= type)
191 ValueTab.resize(type+1, ValueList());
192 //printf("Values[%d][%d] = %d\n", type, ValueTab[type].size(), D);
193 ValueTab[type].push_back(D);
194 return ValueTab[type].size()-1;
197 // TODO: FIXME when Type are not const
198 static void InsertType(const Type *Ty, std::vector<PATypeHolder> &Types) {
202 static const Type *getTypeVal(const ValID &D, bool DoNotImprovise = false) {
204 case ValID::NumberVal: { // Is it a numbered definition?
205 unsigned Num = (unsigned)D.Num;
207 // Module constants occupy the lowest numbered slots...
208 if (Num < CurModule.Types.size())
209 return CurModule.Types[Num];
211 Num -= CurModule.Types.size();
213 // Check that the number is within bounds...
214 if (Num <= CurMeth.Types.size())
215 return CurMeth.Types[Num];
218 case ValID::NameVal: { // Is it a named definition?
219 std::string Name(D.Name);
220 SymbolTable *SymTab = 0;
222 if (inFunctionScope()) {
223 SymTab = &CurMeth.CurrentFunction->getSymbolTable();
224 N = SymTab->lookup(Type::TypeTy, Name);
228 // Symbol table doesn't automatically chain yet... because the function
229 // hasn't been added to the module...
231 SymTab = &CurModule.CurrentModule->getSymbolTable();
232 N = SymTab->lookup(Type::TypeTy, Name);
236 D.destroy(); // Free old strdup'd memory...
237 return cast<Type>(N);
240 ThrowException("Internal parser error: Invalid symbol type reference!");
243 // If we reached here, we referenced either a symbol that we don't know about
244 // or an id number that hasn't been read yet. We may be referencing something
245 // forward, so just create an entry to be resolved later and get to it...
247 if (DoNotImprovise) return 0; // Do we just want a null to be returned?
249 std::map<ValID, PATypeHolder> &LateResolver = inFunctionScope() ?
250 CurMeth.LateResolveTypes : CurModule.LateResolveTypes;
252 std::map<ValID, PATypeHolder>::iterator I = LateResolver.find(D);
253 if (I != LateResolver.end()) {
257 Type *Typ = OpaqueType::get();
258 LateResolver.insert(std::make_pair(D, Typ));
262 static Value *lookupInSymbolTable(const Type *Ty, const std::string &Name) {
263 SymbolTable &SymTab =
264 inFunctionScope() ? CurMeth.CurrentFunction->getSymbolTable() :
265 CurModule.CurrentModule->getSymbolTable();
266 return SymTab.lookup(Ty, Name);
269 // getValNonImprovising - Look up the value specified by the provided type and
270 // the provided ValID. If the value exists and has already been defined, return
271 // it. Otherwise return null.
273 static Value *getValNonImprovising(const Type *Ty, const ValID &D) {
274 if (isa<FunctionType>(Ty))
275 ThrowException("Functions are not values and "
276 "must be referenced as pointers");
279 case ValID::NumberVal: { // Is it a numbered definition?
280 unsigned type = Ty->getUniqueID();
281 unsigned Num = (unsigned)D.Num;
283 // Module constants occupy the lowest numbered slots...
284 if (type < CurModule.Values.size()) {
285 if (Num < CurModule.Values[type].size())
286 return CurModule.Values[type][Num];
288 Num -= CurModule.Values[type].size();
291 // Make sure that our type is within bounds
292 if (CurMeth.Values.size() <= type) return 0;
294 // Check that the number is within bounds...
295 if (CurMeth.Values[type].size() <= Num) return 0;
297 return CurMeth.Values[type][Num];
300 case ValID::NameVal: { // Is it a named definition?
301 Value *N = lookupInSymbolTable(Ty, std::string(D.Name));
302 if (N == 0) return 0;
304 D.destroy(); // Free old strdup'd memory...
308 // Check to make sure that "Ty" is an integral type, and that our
309 // value will fit into the specified type...
310 case ValID::ConstSIntVal: // Is it a constant pool reference??
311 if (!ConstantSInt::isValueValidForType(Ty, D.ConstPool64))
312 ThrowException("Signed integral constant '" +
313 itostr(D.ConstPool64) + "' is invalid for type '" +
314 Ty->getDescription() + "'!");
315 return ConstantSInt::get(Ty, D.ConstPool64);
317 case ValID::ConstUIntVal: // Is it an unsigned const pool reference?
318 if (!ConstantUInt::isValueValidForType(Ty, D.UConstPool64)) {
319 if (!ConstantSInt::isValueValidForType(Ty, D.ConstPool64)) {
320 ThrowException("Integral constant '" + utostr(D.UConstPool64) +
321 "' is invalid or out of range!");
322 } else { // This is really a signed reference. Transmogrify.
323 return ConstantSInt::get(Ty, D.ConstPool64);
326 return ConstantUInt::get(Ty, D.UConstPool64);
329 case ValID::ConstFPVal: // Is it a floating point const pool reference?
330 if (!ConstantFP::isValueValidForType(Ty, D.ConstPoolFP))
331 ThrowException("FP constant invalid for type!!");
332 return ConstantFP::get(Ty, D.ConstPoolFP);
334 case ValID::ConstNullVal: // Is it a null value?
335 if (!isa<PointerType>(Ty))
336 ThrowException("Cannot create a a non pointer null!");
337 return ConstantPointerNull::get(cast<PointerType>(Ty));
339 case ValID::ConstantVal: // Fully resolved constant?
340 if (D.ConstantValue->getType() != Ty)
341 ThrowException("Constant expression type different from required type!");
342 return D.ConstantValue;
345 assert(0 && "Unhandled case!");
349 assert(0 && "Unhandled case!");
354 // getVal - This function is identical to getValNonImprovising, except that if a
355 // value is not already defined, it "improvises" by creating a placeholder var
356 // that looks and acts just like the requested variable. When the value is
357 // defined later, all uses of the placeholder variable are replaced with the
360 static Value *getVal(const Type *Ty, const ValID &D) {
361 assert(Ty != Type::TypeTy && "Should use getTypeVal for types!");
363 // See if the value has already been defined...
364 Value *V = getValNonImprovising(Ty, D);
367 // If we reached here, we referenced either a symbol that we don't know about
368 // or an id number that hasn't been read yet. We may be referencing something
369 // forward, so just create an entry to be resolved later and get to it...
372 switch (Ty->getPrimitiveID()) {
373 case Type::LabelTyID: d = new BBPlaceHolder(Ty, D); break;
374 default: d = new ValuePlaceHolder(Ty, D); break;
377 assert(d != 0 && "How did we not make something?");
378 if (inFunctionScope())
379 InsertValue(d, CurMeth.LateResolveValues);
381 InsertValue(d, CurModule.LateResolveValues);
386 //===----------------------------------------------------------------------===//
387 // Code to handle forward references in instructions
388 //===----------------------------------------------------------------------===//
390 // This code handles the late binding needed with statements that reference
391 // values not defined yet... for example, a forward branch, or the PHI node for
394 // This keeps a table (CurMeth.LateResolveValues) of all such forward references
395 // and back patchs after we are done.
398 // ResolveDefinitions - If we could not resolve some defs at parsing
399 // time (forward branches, phi functions for loops, etc...) resolve the
402 static void ResolveDefinitions(std::vector<ValueList> &LateResolvers,
403 std::vector<ValueList> *FutureLateResolvers) {
404 // Loop over LateResolveDefs fixing up stuff that couldn't be resolved
405 for (unsigned ty = 0; ty < LateResolvers.size(); ty++) {
406 while (!LateResolvers[ty].empty()) {
407 Value *V = LateResolvers[ty].back();
408 assert(!isa<Type>(V) && "Types should be in LateResolveTypes!");
410 LateResolvers[ty].pop_back();
411 ValID &DID = getValIDFromPlaceHolder(V);
413 Value *TheRealValue = getValNonImprovising(Type::getUniqueIDType(ty),DID);
415 V->replaceAllUsesWith(TheRealValue);
417 } else if (FutureLateResolvers) {
418 // Functions have their unresolved items forwarded to the module late
420 InsertValue(V, *FutureLateResolvers);
422 if (DID.Type == ValID::NameVal)
423 ThrowException("Reference to an invalid definition: '" +DID.getName()+
424 "' of type '" + V->getType()->getDescription() + "'",
425 getLineNumFromPlaceHolder(V));
427 ThrowException("Reference to an invalid definition: #" +
428 itostr(DID.Num) + " of type '" +
429 V->getType()->getDescription() + "'",
430 getLineNumFromPlaceHolder(V));
435 LateResolvers.clear();
438 // ResolveTypeTo - A brand new type was just declared. This means that (if
439 // name is not null) things referencing Name can be resolved. Otherwise, things
440 // refering to the number can be resolved. Do this now.
442 static void ResolveTypeTo(char *Name, const Type *ToTy) {
443 std::vector<PATypeHolder> &Types = inFunctionScope() ?
444 CurMeth.Types : CurModule.Types;
447 if (Name) D = ValID::create(Name);
448 else D = ValID::create((int)Types.size());
450 std::map<ValID, PATypeHolder> &LateResolver = inFunctionScope() ?
451 CurMeth.LateResolveTypes : CurModule.LateResolveTypes;
453 std::map<ValID, PATypeHolder>::iterator I = LateResolver.find(D);
454 if (I != LateResolver.end()) {
455 ((DerivedType*)I->second.get())->refineAbstractTypeTo(ToTy);
456 LateResolver.erase(I);
460 // ResolveTypes - At this point, all types should be resolved. Any that aren't
463 static void ResolveTypes(std::map<ValID, PATypeHolder> &LateResolveTypes) {
464 if (!LateResolveTypes.empty()) {
465 const ValID &DID = LateResolveTypes.begin()->first;
467 if (DID.Type == ValID::NameVal)
468 ThrowException("Reference to an invalid type: '" +DID.getName() + "'");
470 ThrowException("Reference to an invalid type: #" + itostr(DID.Num));
475 // setValueName - Set the specified value to the name given. The name may be
476 // null potentially, in which case this is a noop. The string passed in is
477 // assumed to be a malloc'd string buffer, and is freed by this function.
479 // This function returns true if the value has already been defined, but is
480 // allowed to be redefined in the specified context. If the name is a new name
481 // for the typeplane, false is returned.
483 static bool setValueName(Value *V, char *NameStr) {
484 if (NameStr == 0) return false;
486 std::string Name(NameStr); // Copy string
487 free(NameStr); // Free old string
489 if (V->getType() == Type::VoidTy)
490 ThrowException("Can't assign name '" + Name +
491 "' to a null valued instruction!");
493 SymbolTable &ST = inFunctionScope() ?
494 CurMeth.CurrentFunction->getSymbolTable() :
495 CurModule.CurrentModule->getSymbolTable();
497 Value *Existing = ST.lookup(V->getType(), Name);
498 if (Existing) { // Inserting a name that is already defined???
499 // There is only one case where this is allowed: when we are refining an
500 // opaque type. In this case, Existing will be an opaque type.
501 if (const Type *Ty = dyn_cast<Type>(Existing)) {
502 if (const OpaqueType *OpTy = dyn_cast<OpaqueType>(Ty)) {
503 // We ARE replacing an opaque type!
504 ((OpaqueType*)OpTy)->refineAbstractTypeTo(cast<Type>(V));
509 // Otherwise, we are a simple redefinition of a value, check to see if it
510 // is defined the same as the old one...
511 if (const Type *Ty = dyn_cast<Type>(Existing)) {
512 if (Ty == cast<Type>(V)) return true; // Yes, it's equal.
513 // std::cerr << "Type: " << Ty->getDescription() << " != "
514 // << cast<Type>(V)->getDescription() << "!\n";
515 } else if (const Constant *C = dyn_cast<Constant>(Existing)) {
516 if (C == V) return true; // Constants are equal to themselves
517 } else if (GlobalVariable *EGV = dyn_cast<GlobalVariable>(Existing)) {
518 // We are allowed to redefine a global variable in two circumstances:
519 // 1. If at least one of the globals is uninitialized or
520 // 2. If both initializers have the same value.
522 if (GlobalVariable *GV = dyn_cast<GlobalVariable>(V)) {
523 if (!EGV->hasInitializer() || !GV->hasInitializer() ||
524 EGV->getInitializer() == GV->getInitializer()) {
526 // Make sure the existing global version gets the initializer! Make
527 // sure that it also gets marked const if the new version is.
528 if (GV->hasInitializer() && !EGV->hasInitializer())
529 EGV->setInitializer(GV->getInitializer());
530 if (GV->isConstant())
531 EGV->setConstant(true);
532 EGV->setLinkage(GV->getLinkage());
534 delete GV; // Destroy the duplicate!
535 return true; // They are equivalent!
539 ThrowException("Redefinition of value named '" + Name + "' in the '" +
540 V->getType()->getDescription() + "' type plane!");
543 V->setName(Name, &ST);
548 //===----------------------------------------------------------------------===//
549 // Code for handling upreferences in type names...
552 // TypeContains - Returns true if Ty contains E in it.
554 static bool TypeContains(const Type *Ty, const Type *E) {
555 return find(df_begin(Ty), df_end(Ty), E) != df_end(Ty);
559 static std::vector<std::pair<unsigned, OpaqueType *> > UpRefs;
561 static PATypeHolder HandleUpRefs(const Type *ty) {
563 UR_OUT("Type '" << ty->getDescription() <<
564 "' newly formed. Resolving upreferences.\n" <<
565 UpRefs.size() << " upreferences active!\n");
566 for (unsigned i = 0; i < UpRefs.size(); ) {
567 UR_OUT(" UR#" << i << " - TypeContains(" << Ty->getDescription() << ", "
568 << UpRefs[i].second->getDescription() << ") = "
569 << (TypeContains(Ty, UpRefs[i].second) ? "true" : "false") << endl);
570 if (TypeContains(Ty, UpRefs[i].second)) {
571 unsigned Level = --UpRefs[i].first; // Decrement level of upreference
572 UR_OUT(" Uplevel Ref Level = " << Level << endl);
573 if (Level == 0) { // Upreference should be resolved!
574 UR_OUT(" * Resolving upreference for "
575 << UpRefs[i].second->getDescription() << endl;
576 std::string OldName = UpRefs[i].second->getDescription());
577 UpRefs[i].second->refineAbstractTypeTo(Ty);
578 UpRefs.erase(UpRefs.begin()+i); // Remove from upreference list...
579 UR_OUT(" * Type '" << OldName << "' refined upreference to: "
580 << (const void*)Ty << ", " << Ty->getDescription() << endl);
585 ++i; // Otherwise, no resolve, move on...
587 // FIXME: TODO: this should return the updated type
592 //===----------------------------------------------------------------------===//
593 // RunVMAsmParser - Define an interface to this parser
594 //===----------------------------------------------------------------------===//
596 Module *RunVMAsmParser(const std::string &Filename, FILE *F) {
598 CurFilename = Filename;
599 llvmAsmlineno = 1; // Reset the current line number...
601 // Allocate a new module to read
602 CurModule.CurrentModule = new Module(Filename);
603 yyparse(); // Parse the file.
604 Module *Result = ParserResult;
605 llvmAsmin = stdin; // F is about to go away, don't use it anymore...
615 Function *FunctionVal;
616 std::pair<PATypeHolder*, char*> *ArgVal;
617 BasicBlock *BasicBlockVal;
618 TerminatorInst *TermInstVal;
619 Instruction *InstVal;
622 const Type *PrimType;
623 PATypeHolder *TypeVal;
626 std::vector<std::pair<PATypeHolder*,char*> > *ArgList;
627 std::vector<Value*> *ValueList;
628 std::list<PATypeHolder> *TypeList;
629 std::list<std::pair<Value*,
630 BasicBlock*> > *PHIList; // Represent the RHS of PHI node
631 std::vector<std::pair<Constant*, BasicBlock*> > *JumpTable;
632 std::vector<Constant*> *ConstVector;
634 GlobalValue::LinkageTypes Linkage;
642 char *StrVal; // This memory is strdup'd!
643 ValID ValIDVal; // strdup'd memory maybe!
645 Instruction::BinaryOps BinaryOpVal;
646 Instruction::TermOps TermOpVal;
647 Instruction::MemoryOps MemOpVal;
648 Instruction::OtherOps OtherOpVal;
649 Module::Endianness Endianness;
652 %type <ModuleVal> Module FunctionList
653 %type <FunctionVal> Function FunctionProto FunctionHeader BasicBlockList
654 %type <BasicBlockVal> BasicBlock InstructionList
655 %type <TermInstVal> BBTerminatorInst
656 %type <InstVal> Inst InstVal MemoryInst
657 %type <ConstVal> ConstVal ConstExpr
658 %type <ConstVector> ConstVector
659 %type <ArgList> ArgList ArgListH
660 %type <ArgVal> ArgVal
661 %type <PHIList> PHIList
662 %type <ValueList> ValueRefList ValueRefListE // For call param lists
663 %type <ValueList> IndexList // For GEP derived indices
664 %type <TypeList> TypeListI ArgTypeListI
665 %type <JumpTable> JumpTable
666 %type <BoolVal> GlobalType // GLOBAL or CONSTANT?
667 %type <Linkage> OptLinkage
668 %type <Endianness> BigOrLittle
670 // ValueRef - Unresolved reference to a definition or BB
671 %type <ValIDVal> ValueRef ConstValueRef SymbolicValueRef
672 %type <ValueVal> ResolvedVal // <type> <valref> pair
673 // Tokens and types for handling constant integer values
675 // ESINT64VAL - A negative number within long long range
676 %token <SInt64Val> ESINT64VAL
678 // EUINT64VAL - A positive number within uns. long long range
679 %token <UInt64Val> EUINT64VAL
680 %type <SInt64Val> EINT64VAL
682 %token <SIntVal> SINTVAL // Signed 32 bit ints...
683 %token <UIntVal> UINTVAL // Unsigned 32 bit ints...
684 %type <SIntVal> INTVAL
685 %token <FPVal> FPVAL // Float or Double constant
688 %type <TypeVal> Types TypesV UpRTypes UpRTypesV
689 %type <PrimType> SIntType UIntType IntType FPType PrimType // Classifications
690 %token <PrimType> VOID BOOL SBYTE UBYTE SHORT USHORT INT UINT LONG ULONG
691 %token <PrimType> FLOAT DOUBLE TYPE LABEL
693 %token <StrVal> VAR_ID LABELSTR STRINGCONSTANT
694 %type <StrVal> Name OptName OptAssign
697 %token IMPLEMENTATION ZEROINITIALIZER TRUE FALSE BEGINTOK ENDTOK
698 %token DECLARE GLOBAL CONSTANT
699 %token TO EXCEPT DOTDOTDOT NULL_TOK CONST INTERNAL LINKONCE APPENDING
700 %token OPAQUE NOT EXTERNAL TARGET ENDIAN POINTERSIZE LITTLE BIG
702 // Basic Block Terminating Operators
703 %token <TermOpVal> RET BR SWITCH
706 %type <BinaryOpVal> BinaryOps // all the binary operators
707 %type <BinaryOpVal> ArithmeticOps LogicalOps SetCondOps // Binops Subcatagories
708 %token <BinaryOpVal> ADD SUB MUL DIV REM AND OR XOR
709 %token <BinaryOpVal> SETLE SETGE SETLT SETGT SETEQ SETNE // Binary Comarators
711 // Memory Instructions
712 %token <MemOpVal> MALLOC ALLOCA FREE LOAD STORE GETELEMENTPTR
715 %type <OtherOpVal> ShiftOps
716 %token <OtherOpVal> PHI CALL INVOKE CAST SHL SHR VA_ARG
721 // Handle constant integer size restriction and conversion...
725 if ($1 > (uint32_t)INT32_MAX) // Outside of my range!
726 ThrowException("Value too large for type!");
731 EINT64VAL : ESINT64VAL; // These have same type and can't cause problems...
732 EINT64VAL : EUINT64VAL {
733 if ($1 > (uint64_t)INT64_MAX) // Outside of my range!
734 ThrowException("Value too large for type!");
738 // Operations that are notably excluded from this list include:
739 // RET, BR, & SWITCH because they end basic blocks and are treated specially.
741 ArithmeticOps: ADD | SUB | MUL | DIV | REM;
742 LogicalOps : AND | OR | XOR;
743 SetCondOps : SETLE | SETGE | SETLT | SETGT | SETEQ | SETNE;
744 BinaryOps : ArithmeticOps | LogicalOps | SetCondOps;
746 ShiftOps : SHL | SHR;
748 // These are some types that allow classification if we only want a particular
749 // thing... for example, only a signed, unsigned, or integral type.
750 SIntType : LONG | INT | SHORT | SBYTE;
751 UIntType : ULONG | UINT | USHORT | UBYTE;
752 IntType : SIntType | UIntType;
753 FPType : FLOAT | DOUBLE;
755 // OptAssign - Value producing statements have an optional assignment component
756 OptAssign : Name '=' {
763 OptLinkage : INTERNAL { $$ = GlobalValue::InternalLinkage; } |
764 LINKONCE { $$ = GlobalValue::LinkOnceLinkage; } |
765 APPENDING { $$ = GlobalValue::AppendingLinkage; } |
766 /*empty*/ { $$ = GlobalValue::ExternalLinkage; };
768 //===----------------------------------------------------------------------===//
769 // Types includes all predefined types... except void, because it can only be
770 // used in specific contexts (function returning void for example). To have
771 // access to it, a user must explicitly use TypesV.
774 // TypesV includes all of 'Types', but it also includes the void type.
775 TypesV : Types | VOID { $$ = new PATypeHolder($1); };
776 UpRTypesV : UpRTypes | VOID { $$ = new PATypeHolder($1); };
780 ThrowException("Invalid upreference in type: " + (*$1)->getDescription());
785 // Derived types are added later...
787 PrimType : BOOL | SBYTE | UBYTE | SHORT | USHORT | INT | UINT ;
788 PrimType : LONG | ULONG | FLOAT | DOUBLE | TYPE | LABEL;
790 $$ = new PATypeHolder(OpaqueType::get());
793 $$ = new PATypeHolder($1);
795 UpRTypes : SymbolicValueRef { // Named types are also simple types...
796 $$ = new PATypeHolder(getTypeVal($1));
799 // Include derived types in the Types production.
801 UpRTypes : '\\' EUINT64VAL { // Type UpReference
802 if ($2 > (uint64_t)INT64_MAX) ThrowException("Value out of range!");
803 OpaqueType *OT = OpaqueType::get(); // Use temporary placeholder
804 UpRefs.push_back(std::make_pair((unsigned)$2, OT)); // Add to vector...
805 $$ = new PATypeHolder(OT);
806 UR_OUT("New Upreference!\n");
808 | UpRTypesV '(' ArgTypeListI ')' { // Function derived type?
809 std::vector<const Type*> Params;
810 mapto($3->begin(), $3->end(), std::back_inserter(Params),
811 std::mem_fun_ref(&PATypeHandle::get));
812 bool isVarArg = Params.size() && Params.back() == Type::VoidTy;
813 if (isVarArg) Params.pop_back();
815 $$ = new PATypeHolder(HandleUpRefs(FunctionType::get(*$1,Params,isVarArg)));
816 delete $3; // Delete the argument list
817 delete $1; // Delete the old type handle
819 | '[' EUINT64VAL 'x' UpRTypes ']' { // Sized array type?
820 $$ = new PATypeHolder(HandleUpRefs(ArrayType::get(*$4, (unsigned)$2)));
823 | '{' TypeListI '}' { // Structure type?
824 std::vector<const Type*> Elements;
825 mapto($2->begin(), $2->end(), std::back_inserter(Elements),
826 std::mem_fun_ref(&PATypeHandle::get));
828 $$ = new PATypeHolder(HandleUpRefs(StructType::get(Elements)));
831 | '{' '}' { // Empty structure type?
832 $$ = new PATypeHolder(StructType::get(std::vector<const Type*>()));
834 | UpRTypes '*' { // Pointer type?
835 $$ = new PATypeHolder(HandleUpRefs(PointerType::get(*$1)));
839 // TypeList - Used for struct declarations and as a basis for function type
840 // declaration type lists
842 TypeListI : UpRTypes {
843 $$ = new std::list<PATypeHolder>();
844 $$->push_back(*$1); delete $1;
846 | TypeListI ',' UpRTypes {
847 ($$=$1)->push_back(*$3); delete $3;
850 // ArgTypeList - List of types for a function type declaration...
851 ArgTypeListI : TypeListI
852 | TypeListI ',' DOTDOTDOT {
853 ($$=$1)->push_back(Type::VoidTy);
856 ($$ = new std::list<PATypeHolder>())->push_back(Type::VoidTy);
859 $$ = new std::list<PATypeHolder>();
862 // ConstVal - The various declarations that go into the constant pool. This
863 // production is used ONLY to represent constants that show up AFTER a 'const',
864 // 'constant' or 'global' token at global scope. Constants that can be inlined
865 // into other expressions (such as integers and constexprs) are handled by the
866 // ResolvedVal, ValueRef and ConstValueRef productions.
868 ConstVal: Types '[' ConstVector ']' { // Nonempty unsized arr
869 const ArrayType *ATy = dyn_cast<ArrayType>($1->get());
871 ThrowException("Cannot make array constant with type: '" +
872 (*$1)->getDescription() + "'!");
873 const Type *ETy = ATy->getElementType();
874 int NumElements = ATy->getNumElements();
876 // Verify that we have the correct size...
877 if (NumElements != -1 && NumElements != (int)$3->size())
878 ThrowException("Type mismatch: constant sized array initialized with " +
879 utostr($3->size()) + " arguments, but has size of " +
880 itostr(NumElements) + "!");
882 // Verify all elements are correct type!
883 for (unsigned i = 0; i < $3->size(); i++) {
884 if (ETy != (*$3)[i]->getType())
885 ThrowException("Element #" + utostr(i) + " is not of type '" +
886 ETy->getDescription() +"' as required!\nIt is of type '"+
887 (*$3)[i]->getType()->getDescription() + "'.");
890 $$ = ConstantArray::get(ATy, *$3);
891 delete $1; delete $3;
894 const ArrayType *ATy = dyn_cast<ArrayType>($1->get());
896 ThrowException("Cannot make array constant with type: '" +
897 (*$1)->getDescription() + "'!");
899 int NumElements = ATy->getNumElements();
900 if (NumElements != -1 && NumElements != 0)
901 ThrowException("Type mismatch: constant sized array initialized with 0"
902 " arguments, but has size of " + itostr(NumElements) +"!");
903 $$ = ConstantArray::get(ATy, std::vector<Constant*>());
906 | Types 'c' STRINGCONSTANT {
907 const ArrayType *ATy = dyn_cast<ArrayType>($1->get());
909 ThrowException("Cannot make array constant with type: '" +
910 (*$1)->getDescription() + "'!");
912 int NumElements = ATy->getNumElements();
913 const Type *ETy = ATy->getElementType();
914 char *EndStr = UnEscapeLexed($3, true);
915 if (NumElements != -1 && NumElements != (EndStr-$3))
916 ThrowException("Can't build string constant of size " +
917 itostr((int)(EndStr-$3)) +
918 " when array has size " + itostr(NumElements) + "!");
919 std::vector<Constant*> Vals;
920 if (ETy == Type::SByteTy) {
921 for (char *C = $3; C != EndStr; ++C)
922 Vals.push_back(ConstantSInt::get(ETy, *C));
923 } else if (ETy == Type::UByteTy) {
924 for (char *C = $3; C != EndStr; ++C)
925 Vals.push_back(ConstantUInt::get(ETy, (unsigned char)*C));
928 ThrowException("Cannot build string arrays of non byte sized elements!");
931 $$ = ConstantArray::get(ATy, Vals);
934 | Types '{' ConstVector '}' {
935 const StructType *STy = dyn_cast<StructType>($1->get());
937 ThrowException("Cannot make struct constant with type: '" +
938 (*$1)->getDescription() + "'!");
940 if ($3->size() != STy->getNumContainedTypes())
941 ThrowException("Illegal number of initializers for structure type!");
943 // Check to ensure that constants are compatible with the type initializer!
944 for (unsigned i = 0, e = $3->size(); i != e; ++i)
945 if ((*$3)[i]->getType() != STy->getElementTypes()[i])
946 ThrowException("Expected type '" +
947 STy->getElementTypes()[i]->getDescription() +
948 "' for element #" + utostr(i) +
949 " of structure initializer!");
951 $$ = ConstantStruct::get(STy, *$3);
952 delete $1; delete $3;
955 const StructType *STy = dyn_cast<StructType>($1->get());
957 ThrowException("Cannot make struct constant with type: '" +
958 (*$1)->getDescription() + "'!");
960 if (STy->getNumContainedTypes() != 0)
961 ThrowException("Illegal number of initializers for structure type!");
963 $$ = ConstantStruct::get(STy, std::vector<Constant*>());
967 const PointerType *PTy = dyn_cast<PointerType>($1->get());
969 ThrowException("Cannot make null pointer constant with type: '" +
970 (*$1)->getDescription() + "'!");
972 $$ = ConstantPointerNull::get(PTy);
975 | Types SymbolicValueRef {
976 const PointerType *Ty = dyn_cast<PointerType>($1->get());
978 ThrowException("Global const reference must be a pointer type!");
980 // ConstExprs can exist in the body of a function, thus creating
981 // ConstantPointerRefs whenever they refer to a variable. Because we are in
982 // the context of a function, getValNonImprovising will search the functions
983 // symbol table instead of the module symbol table for the global symbol,
984 // which throws things all off. To get around this, we just tell
985 // getValNonImprovising that we are at global scope here.
987 Function *SavedCurFn = CurMeth.CurrentFunction;
988 CurMeth.CurrentFunction = 0;
990 Value *V = getValNonImprovising(Ty, $2);
992 CurMeth.CurrentFunction = SavedCurFn;
994 // If this is an initializer for a constant pointer, which is referencing a
995 // (currently) undefined variable, create a stub now that shall be replaced
996 // in the future with the right type of variable.
999 assert(isa<PointerType>(Ty) && "Globals may only be used as pointers!");
1000 const PointerType *PT = cast<PointerType>(Ty);
1002 // First check to see if the forward references value is already created!
1003 PerModuleInfo::GlobalRefsType::iterator I =
1004 CurModule.GlobalRefs.find(std::make_pair(PT, $2));
1006 if (I != CurModule.GlobalRefs.end()) {
1007 V = I->second; // Placeholder already exists, use it...
1009 // TODO: Include line number info by creating a subclass of
1010 // TODO: GlobalVariable here that includes the said information!
1012 // Create a placeholder for the global variable reference...
1013 GlobalVariable *GV = new GlobalVariable(PT->getElementType(),
1015 GlobalValue::ExternalLinkage);
1016 // Keep track of the fact that we have a forward ref to recycle it
1017 CurModule.GlobalRefs.insert(std::make_pair(std::make_pair(PT, $2), GV));
1019 // Must temporarily push this value into the module table...
1020 CurModule.CurrentModule->getGlobalList().push_back(GV);
1025 GlobalValue *GV = cast<GlobalValue>(V);
1026 $$ = ConstantPointerRef::get(GV);
1027 delete $1; // Free the type handle
1030 if ($1->get() != $2->getType())
1031 ThrowException("Mismatched types for constant expression!");
1035 | Types ZEROINITIALIZER {
1036 $$ = Constant::getNullValue($1->get());
1040 ConstVal : SIntType EINT64VAL { // integral constants
1041 if (!ConstantSInt::isValueValidForType($1, $2))
1042 ThrowException("Constant value doesn't fit in type!");
1043 $$ = ConstantSInt::get($1, $2);
1045 | UIntType EUINT64VAL { // integral constants
1046 if (!ConstantUInt::isValueValidForType($1, $2))
1047 ThrowException("Constant value doesn't fit in type!");
1048 $$ = ConstantUInt::get($1, $2);
1050 | BOOL TRUE { // Boolean constants
1051 $$ = ConstantBool::True;
1053 | BOOL FALSE { // Boolean constants
1054 $$ = ConstantBool::False;
1056 | FPType FPVAL { // Float & Double constants
1057 $$ = ConstantFP::get($1, $2);
1061 ConstExpr: CAST '(' ConstVal TO Types ')' {
1062 $$ = ConstantExpr::getCast($3, $5->get());
1065 | GETELEMENTPTR '(' ConstVal IndexList ')' {
1066 if (!isa<PointerType>($3->getType()))
1067 ThrowException("GetElementPtr requires a pointer operand!");
1070 GetElementPtrInst::getIndexedType($3->getType(), *$4, true);
1072 ThrowException("Index list invalid for constant getelementptr!");
1074 std::vector<Constant*> IdxVec;
1075 for (unsigned i = 0, e = $4->size(); i != e; ++i)
1076 if (Constant *C = dyn_cast<Constant>((*$4)[i]))
1077 IdxVec.push_back(C);
1079 ThrowException("Indices to constant getelementptr must be constants!");
1083 $$ = ConstantExpr::getGetElementPtr($3, IdxVec);
1085 | BinaryOps '(' ConstVal ',' ConstVal ')' {
1086 if ($3->getType() != $5->getType())
1087 ThrowException("Binary operator types must match!");
1088 $$ = ConstantExpr::get($1, $3, $5);
1090 | ShiftOps '(' ConstVal ',' ConstVal ')' {
1091 if ($5->getType() != Type::UByteTy)
1092 ThrowException("Shift count for shift constant must be unsigned byte!");
1093 if (!$3->getType()->isIntegral())
1094 ThrowException("Shift constant expression requires integral operand!");
1095 $$ = ConstantExpr::getShift($1, $3, $5);
1099 // ConstVector - A list of comma separated constants.
1100 ConstVector : ConstVector ',' ConstVal {
1101 ($$ = $1)->push_back($3);
1104 $$ = new std::vector<Constant*>();
1109 // GlobalType - Match either GLOBAL or CONSTANT for global declarations...
1110 GlobalType : GLOBAL { $$ = false; } | CONSTANT { $$ = true; };
1113 //===----------------------------------------------------------------------===//
1114 // Rules to match Modules
1115 //===----------------------------------------------------------------------===//
1117 // Module rule: Capture the result of parsing the whole file into a result
1120 Module : FunctionList {
1121 $$ = ParserResult = $1;
1122 CurModule.ModuleDone();
1125 // FunctionList - A list of functions, preceeded by a constant pool.
1127 FunctionList : FunctionList Function {
1129 assert($2->getParent() == 0 && "Function already in module!");
1130 $1->getFunctionList().push_back($2);
1131 CurMeth.FunctionDone();
1133 | FunctionList FunctionProto {
1136 | FunctionList IMPLEMENTATION {
1140 $$ = CurModule.CurrentModule;
1141 // Resolve circular types before we parse the body of the module
1142 ResolveTypes(CurModule.LateResolveTypes);
1145 // ConstPool - Constants with optional names assigned to them.
1146 ConstPool : ConstPool OptAssign CONST ConstVal {
1147 if (!setValueName($4, $2))
1150 | ConstPool OptAssign TYPE TypesV { // Types can be defined in the const pool
1151 // Eagerly resolve types. This is not an optimization, this is a
1152 // requirement that is due to the fact that we could have this:
1154 // %list = type { %list * }
1155 // %list = type { %list * } ; repeated type decl
1157 // If types are not resolved eagerly, then the two types will not be
1158 // determined to be the same type!
1160 ResolveTypeTo($2, $4->get());
1162 // TODO: FIXME when Type are not const
1163 if (!setValueName(const_cast<Type*>($4->get()), $2)) {
1164 // If this is not a redefinition of a type...
1166 InsertType($4->get(),
1167 inFunctionScope() ? CurMeth.Types : CurModule.Types);
1173 | ConstPool FunctionProto { // Function prototypes can be in const pool
1175 | ConstPool OptAssign OptLinkage GlobalType ConstVal {
1176 const Type *Ty = $5->getType();
1177 // Global declarations appear in Constant Pool
1178 Constant *Initializer = $5;
1179 if (Initializer == 0)
1180 ThrowException("Global value initializer is not a constant!");
1182 GlobalVariable *GV = new GlobalVariable(Ty, $4, $3, Initializer);
1183 if (!setValueName(GV, $2)) { // If not redefining...
1184 CurModule.CurrentModule->getGlobalList().push_back(GV);
1185 int Slot = InsertValue(GV, CurModule.Values);
1188 CurModule.DeclareNewGlobalValue(GV, ValID::create(Slot));
1190 CurModule.DeclareNewGlobalValue(GV, ValID::create(
1191 (char*)GV->getName().c_str()));
1195 | ConstPool OptAssign EXTERNAL GlobalType Types {
1196 const Type *Ty = *$5;
1197 // Global declarations appear in Constant Pool
1198 GlobalVariable *GV = new GlobalVariable(Ty,$4,GlobalValue::ExternalLinkage);
1199 if (!setValueName(GV, $2)) { // If not redefining...
1200 CurModule.CurrentModule->getGlobalList().push_back(GV);
1201 int Slot = InsertValue(GV, CurModule.Values);
1204 CurModule.DeclareNewGlobalValue(GV, ValID::create(Slot));
1206 assert(GV->hasName() && "Not named and not numbered!?");
1207 CurModule.DeclareNewGlobalValue(GV, ValID::create(
1208 (char*)GV->getName().c_str()));
1213 | ConstPool TARGET TargetDefinition {
1215 | /* empty: end of list */ {
1220 BigOrLittle : BIG { $$ = Module::BigEndian; };
1221 BigOrLittle : LITTLE { $$ = Module::LittleEndian; };
1223 TargetDefinition : ENDIAN '=' BigOrLittle {
1224 CurModule.CurrentModule->setEndianness($3);
1226 | POINTERSIZE '=' EUINT64VAL {
1228 CurModule.CurrentModule->setPointerSize(Module::Pointer32);
1230 CurModule.CurrentModule->setPointerSize(Module::Pointer64);
1232 ThrowException("Invalid pointer size: '" + utostr($3) + "'!");
1236 //===----------------------------------------------------------------------===//
1237 // Rules to match Function Headers
1238 //===----------------------------------------------------------------------===//
1240 Name : VAR_ID | STRINGCONSTANT;
1241 OptName : Name | /*empty*/ { $$ = 0; };
1243 ArgVal : Types OptName {
1244 if (*$1 == Type::VoidTy)
1245 ThrowException("void typed arguments are invalid!");
1246 $$ = new std::pair<PATypeHolder*, char*>($1, $2);
1249 ArgListH : ArgListH ',' ArgVal {
1255 $$ = new std::vector<std::pair<PATypeHolder*,char*> >();
1260 ArgList : ArgListH {
1263 | ArgListH ',' DOTDOTDOT {
1265 $$->push_back(std::pair<PATypeHolder*,
1266 char*>(new PATypeHolder(Type::VoidTy), 0));
1269 $$ = new std::vector<std::pair<PATypeHolder*,char*> >();
1270 $$->push_back(std::make_pair(new PATypeHolder(Type::VoidTy), (char*)0));
1276 FunctionHeaderH : TypesV Name '(' ArgList ')' {
1278 std::string FunctionName($2);
1280 std::vector<const Type*> ParamTypeList;
1281 if ($4) { // If there are arguments...
1282 for (std::vector<std::pair<PATypeHolder*,char*> >::iterator I = $4->begin();
1283 I != $4->end(); ++I)
1284 ParamTypeList.push_back(I->first->get());
1287 bool isVarArg = ParamTypeList.size() && ParamTypeList.back() == Type::VoidTy;
1288 if (isVarArg) ParamTypeList.pop_back();
1290 const FunctionType *FT = FunctionType::get(*$1, ParamTypeList, isVarArg);
1291 const PointerType *PFT = PointerType::get(FT);
1295 // Is the function already in symtab?
1296 if ((Fn = CurModule.CurrentModule->getFunction(FunctionName, FT))) {
1297 // Yes it is. If this is the case, either we need to be a forward decl,
1298 // or it needs to be.
1299 if (!CurMeth.isDeclare && !Fn->isExternal())
1300 ThrowException("Redefinition of function '" + FunctionName + "'!");
1302 // If we found a preexisting function prototype, remove it from the
1303 // module, so that we don't get spurious conflicts with global & local
1306 CurModule.CurrentModule->getFunctionList().remove(Fn);
1308 // Make sure to strip off any argument names so we can't get conflicts...
1309 for (Function::aiterator AI = Fn->abegin(), AE = Fn->aend(); AI != AE; ++AI)
1312 } else { // Not already defined?
1313 Fn = new Function(FT, GlobalValue::ExternalLinkage, FunctionName);
1314 InsertValue(Fn, CurModule.Values);
1315 CurModule.DeclareNewGlobalValue(Fn, ValID::create($2));
1317 free($2); // Free strdup'd memory!
1319 CurMeth.FunctionStart(Fn);
1321 // Add all of the arguments we parsed to the function...
1322 if ($4) { // Is null if empty...
1323 if (isVarArg) { // Nuke the last entry
1324 assert($4->back().first->get() == Type::VoidTy && $4->back().second == 0&&
1325 "Not a varargs marker!");
1326 delete $4->back().first;
1327 $4->pop_back(); // Delete the last entry
1329 Function::aiterator ArgIt = Fn->abegin();
1330 for (std::vector<std::pair<PATypeHolder*, char*> >::iterator I =$4->begin();
1331 I != $4->end(); ++I, ++ArgIt) {
1332 delete I->first; // Delete the typeholder...
1334 if (setValueName(ArgIt, I->second)) // Insert arg into symtab...
1335 assert(0 && "No arg redef allowed!");
1340 delete $4; // We're now done with the argument list
1344 BEGIN : BEGINTOK | '{'; // Allow BEGIN or '{' to start a function
1346 FunctionHeader : OptLinkage FunctionHeaderH BEGIN {
1347 $$ = CurMeth.CurrentFunction;
1349 // Make sure that we keep track of the linkage type even if there was a
1350 // previous "declare".
1353 // Resolve circular types before we parse the body of the function.
1354 ResolveTypes(CurMeth.LateResolveTypes);
1357 END : ENDTOK | '}'; // Allow end of '}' to end a function
1359 Function : BasicBlockList END {
1363 FunctionProto : DECLARE { CurMeth.isDeclare = true; } FunctionHeaderH {
1364 $$ = CurMeth.CurrentFunction;
1365 assert($$->getParent() == 0 && "Function already in module!");
1366 CurModule.CurrentModule->getFunctionList().push_back($$);
1367 CurMeth.FunctionDone();
1370 //===----------------------------------------------------------------------===//
1371 // Rules to match Basic Blocks
1372 //===----------------------------------------------------------------------===//
1374 ConstValueRef : ESINT64VAL { // A reference to a direct constant
1375 $$ = ValID::create($1);
1378 $$ = ValID::create($1);
1380 | FPVAL { // Perhaps it's an FP constant?
1381 $$ = ValID::create($1);
1384 $$ = ValID::create(ConstantBool::True);
1387 $$ = ValID::create(ConstantBool::False);
1390 $$ = ValID::createNull();
1393 $$ = ValID::create($1);
1396 // SymbolicValueRef - Reference to one of two ways of symbolically refering to
1399 SymbolicValueRef : INTVAL { // Is it an integer reference...?
1400 $$ = ValID::create($1);
1402 | Name { // Is it a named reference...?
1403 $$ = ValID::create($1);
1406 // ValueRef - A reference to a definition... either constant or symbolic
1407 ValueRef : SymbolicValueRef | ConstValueRef;
1410 // ResolvedVal - a <type> <value> pair. This is used only in cases where the
1411 // type immediately preceeds the value reference, and allows complex constant
1412 // pool references (for things like: 'ret [2 x int] [ int 12, int 42]')
1413 ResolvedVal : Types ValueRef {
1414 $$ = getVal(*$1, $2); delete $1;
1417 BasicBlockList : BasicBlockList BasicBlock {
1418 ($$ = $1)->getBasicBlockList().push_back($2);
1420 | FunctionHeader BasicBlock { // Do not allow functions with 0 basic blocks
1421 ($$ = $1)->getBasicBlockList().push_back($2);
1425 // Basic blocks are terminated by branching instructions:
1426 // br, br/cc, switch, ret
1428 BasicBlock : InstructionList OptAssign BBTerminatorInst {
1429 if (setValueName($3, $2)) { assert(0 && "No redefn allowed!"); }
1432 $1->getInstList().push_back($3);
1436 | LABELSTR InstructionList OptAssign BBTerminatorInst {
1437 if (setValueName($4, $3)) { assert(0 && "No redefn allowed!"); }
1440 $2->getInstList().push_back($4);
1441 if (setValueName($2, $1)) { assert(0 && "No label redef allowed!"); }
1447 InstructionList : InstructionList Inst {
1448 $1->getInstList().push_back($2);
1452 $$ = new BasicBlock();
1455 BBTerminatorInst : RET ResolvedVal { // Return with a result...
1456 $$ = new ReturnInst($2);
1458 | RET VOID { // Return with no result...
1459 $$ = new ReturnInst();
1461 | BR LABEL ValueRef { // Unconditional Branch...
1462 $$ = new BranchInst(cast<BasicBlock>(getVal(Type::LabelTy, $3)));
1463 } // Conditional Branch...
1464 | BR BOOL ValueRef ',' LABEL ValueRef ',' LABEL ValueRef {
1465 $$ = new BranchInst(cast<BasicBlock>(getVal(Type::LabelTy, $6)),
1466 cast<BasicBlock>(getVal(Type::LabelTy, $9)),
1467 getVal(Type::BoolTy, $3));
1469 | SWITCH IntType ValueRef ',' LABEL ValueRef '[' JumpTable ']' {
1470 SwitchInst *S = new SwitchInst(getVal($2, $3),
1471 cast<BasicBlock>(getVal(Type::LabelTy, $6)));
1474 std::vector<std::pair<Constant*,BasicBlock*> >::iterator I = $8->begin(),
1477 S->addCase(I->first, I->second);
1479 | SWITCH IntType ValueRef ',' LABEL ValueRef '[' ']' {
1480 SwitchInst *S = new SwitchInst(getVal($2, $3),
1481 cast<BasicBlock>(getVal(Type::LabelTy, $6)));
1484 | INVOKE TypesV ValueRef '(' ValueRefListE ')' TO ResolvedVal
1485 EXCEPT ResolvedVal {
1486 const PointerType *PFTy;
1487 const FunctionType *Ty;
1489 if (!(PFTy = dyn_cast<PointerType>($2->get())) ||
1490 !(Ty = dyn_cast<FunctionType>(PFTy->getElementType()))) {
1491 // Pull out the types of all of the arguments...
1492 std::vector<const Type*> ParamTypes;
1494 for (std::vector<Value*>::iterator I = $5->begin(), E = $5->end();
1496 ParamTypes.push_back((*I)->getType());
1499 bool isVarArg = ParamTypes.size() && ParamTypes.back() == Type::VoidTy;
1500 if (isVarArg) ParamTypes.pop_back();
1502 Ty = FunctionType::get($2->get(), ParamTypes, isVarArg);
1503 PFTy = PointerType::get(Ty);
1507 Value *V = getVal(PFTy, $3); // Get the function we're calling...
1509 BasicBlock *Normal = dyn_cast<BasicBlock>($8);
1510 BasicBlock *Except = dyn_cast<BasicBlock>($10);
1512 if (Normal == 0 || Except == 0)
1513 ThrowException("Invoke instruction without label destinations!");
1515 // Create the call node...
1516 if (!$5) { // Has no arguments?
1517 $$ = new InvokeInst(V, Normal, Except, std::vector<Value*>());
1518 } else { // Has arguments?
1519 // Loop through FunctionType's arguments and ensure they are specified
1522 FunctionType::ParamTypes::const_iterator I = Ty->getParamTypes().begin();
1523 FunctionType::ParamTypes::const_iterator E = Ty->getParamTypes().end();
1524 std::vector<Value*>::iterator ArgI = $5->begin(), ArgE = $5->end();
1526 for (; ArgI != ArgE && I != E; ++ArgI, ++I)
1527 if ((*ArgI)->getType() != *I)
1528 ThrowException("Parameter " +(*ArgI)->getName()+ " is not of type '" +
1529 (*I)->getDescription() + "'!");
1531 if (I != E || (ArgI != ArgE && !Ty->isVarArg()))
1532 ThrowException("Invalid number of parameters detected!");
1534 $$ = new InvokeInst(V, Normal, Except, *$5);
1541 JumpTable : JumpTable IntType ConstValueRef ',' LABEL ValueRef {
1543 Constant *V = cast<Constant>(getValNonImprovising($2, $3));
1545 ThrowException("May only switch on a constant pool value!");
1547 $$->push_back(std::make_pair(V, cast<BasicBlock>(getVal($5, $6))));
1549 | IntType ConstValueRef ',' LABEL ValueRef {
1550 $$ = new std::vector<std::pair<Constant*, BasicBlock*> >();
1551 Constant *V = cast<Constant>(getValNonImprovising($1, $2));
1554 ThrowException("May only switch on a constant pool value!");
1556 $$->push_back(std::make_pair(V, cast<BasicBlock>(getVal($4, $5))));
1559 Inst : OptAssign InstVal {
1560 // Is this definition named?? if so, assign the name...
1561 if (setValueName($2, $1)) { assert(0 && "No redefin allowed!"); }
1566 PHIList : Types '[' ValueRef ',' ValueRef ']' { // Used for PHI nodes
1567 $$ = new std::list<std::pair<Value*, BasicBlock*> >();
1568 $$->push_back(std::make_pair(getVal(*$1, $3),
1569 cast<BasicBlock>(getVal(Type::LabelTy, $5))));
1572 | PHIList ',' '[' ValueRef ',' ValueRef ']' {
1574 $1->push_back(std::make_pair(getVal($1->front().first->getType(), $4),
1575 cast<BasicBlock>(getVal(Type::LabelTy, $6))));
1579 ValueRefList : ResolvedVal { // Used for call statements, and memory insts...
1580 $$ = new std::vector<Value*>();
1583 | ValueRefList ',' ResolvedVal {
1588 // ValueRefListE - Just like ValueRefList, except that it may also be empty!
1589 ValueRefListE : ValueRefList | /*empty*/ { $$ = 0; };
1591 InstVal : ArithmeticOps Types ValueRef ',' ValueRef {
1592 if (!(*$2)->isInteger() && !(*$2)->isFloatingPoint())
1593 ThrowException("Arithmetic operator requires integer or FP operands!");
1594 $$ = BinaryOperator::create($1, getVal(*$2, $3), getVal(*$2, $5));
1596 ThrowException("binary operator returned null!");
1599 | LogicalOps Types ValueRef ',' ValueRef {
1600 if (!(*$2)->isIntegral())
1601 ThrowException("Logical operator requires integral operands!");
1602 $$ = BinaryOperator::create($1, getVal(*$2, $3), getVal(*$2, $5));
1604 ThrowException("binary operator returned null!");
1607 | SetCondOps Types ValueRef ',' ValueRef {
1608 $$ = new SetCondInst($1, getVal(*$2, $3), getVal(*$2, $5));
1610 ThrowException("binary operator returned null!");
1614 std::cerr << "WARNING: Use of eliminated 'not' instruction:"
1615 << " Replacing with 'xor'.\n";
1617 Value *Ones = ConstantIntegral::getAllOnesValue($2->getType());
1619 ThrowException("Expected integral type for not instruction!");
1621 $$ = BinaryOperator::create(Instruction::Xor, $2, Ones);
1623 ThrowException("Could not create a xor instruction!");
1625 | ShiftOps ResolvedVal ',' ResolvedVal {
1626 if ($4->getType() != Type::UByteTy)
1627 ThrowException("Shift amount must be ubyte!");
1628 $$ = new ShiftInst($1, $2, $4);
1630 | CAST ResolvedVal TO Types {
1631 $$ = new CastInst($2, *$4);
1634 | VA_ARG ResolvedVal ',' Types {
1635 $$ = new VarArgInst($2, *$4);
1639 const Type *Ty = $2->front().first->getType();
1640 $$ = new PHINode(Ty);
1641 while ($2->begin() != $2->end()) {
1642 if ($2->front().first->getType() != Ty)
1643 ThrowException("All elements of a PHI node must be of the same type!");
1644 cast<PHINode>($$)->addIncoming($2->front().first, $2->front().second);
1647 delete $2; // Free the list...
1649 | CALL TypesV ValueRef '(' ValueRefListE ')' {
1650 const PointerType *PFTy;
1651 const FunctionType *Ty;
1653 if (!(PFTy = dyn_cast<PointerType>($2->get())) ||
1654 !(Ty = dyn_cast<FunctionType>(PFTy->getElementType()))) {
1655 // Pull out the types of all of the arguments...
1656 std::vector<const Type*> ParamTypes;
1658 for (std::vector<Value*>::iterator I = $5->begin(), E = $5->end();
1660 ParamTypes.push_back((*I)->getType());
1663 bool isVarArg = ParamTypes.size() && ParamTypes.back() == Type::VoidTy;
1664 if (isVarArg) ParamTypes.pop_back();
1666 Ty = FunctionType::get($2->get(), ParamTypes, isVarArg);
1667 PFTy = PointerType::get(Ty);
1671 Value *V = getVal(PFTy, $3); // Get the function we're calling...
1673 // Create the call node...
1674 if (!$5) { // Has no arguments?
1675 // Make sure no arguments is a good thing!
1676 if (Ty->getNumParams() != 0)
1677 ThrowException("No arguments passed to a function that "
1678 "expects arguments!");
1680 $$ = new CallInst(V, std::vector<Value*>());
1681 } else { // Has arguments?
1682 // Loop through FunctionType's arguments and ensure they are specified
1685 FunctionType::ParamTypes::const_iterator I = Ty->getParamTypes().begin();
1686 FunctionType::ParamTypes::const_iterator E = Ty->getParamTypes().end();
1687 std::vector<Value*>::iterator ArgI = $5->begin(), ArgE = $5->end();
1689 for (; ArgI != ArgE && I != E; ++ArgI, ++I)
1690 if ((*ArgI)->getType() != *I)
1691 ThrowException("Parameter " +(*ArgI)->getName()+ " is not of type '" +
1692 (*I)->getDescription() + "'!");
1694 if (I != E || (ArgI != ArgE && !Ty->isVarArg()))
1695 ThrowException("Invalid number of parameters detected!");
1697 $$ = new CallInst(V, *$5);
1706 // IndexList - List of indices for GEP based instructions...
1707 IndexList : ',' ValueRefList {
1710 $$ = new std::vector<Value*>();
1713 MemoryInst : MALLOC Types {
1714 $$ = new MallocInst(*$2);
1717 | MALLOC Types ',' UINT ValueRef {
1718 $$ = new MallocInst(*$2, getVal($4, $5));
1722 $$ = new AllocaInst(*$2);
1725 | ALLOCA Types ',' UINT ValueRef {
1726 $$ = new AllocaInst(*$2, getVal($4, $5));
1729 | FREE ResolvedVal {
1730 if (!isa<PointerType>($2->getType()))
1731 ThrowException("Trying to free nonpointer type " +
1732 $2->getType()->getDescription() + "!");
1733 $$ = new FreeInst($2);
1736 | LOAD Types ValueRef {
1737 if (!isa<PointerType>($2->get()))
1738 ThrowException("Can't load from nonpointer type: " +
1739 (*$2)->getDescription());
1740 $$ = new LoadInst(getVal(*$2, $3));
1743 | STORE ResolvedVal ',' Types ValueRef {
1744 const PointerType *PT = dyn_cast<PointerType>($4->get());
1746 ThrowException("Can't store to a nonpointer type: " +
1747 (*$4)->getDescription());
1748 const Type *ElTy = PT->getElementType();
1749 if (ElTy != $2->getType())
1750 ThrowException("Can't store '" + $2->getType()->getDescription() +
1751 "' into space of type '" + ElTy->getDescription() + "'!");
1753 $$ = new StoreInst($2, getVal(*$4, $5));
1756 | GETELEMENTPTR Types ValueRef IndexList {
1757 if (!isa<PointerType>($2->get()))
1758 ThrowException("getelementptr insn requires pointer operand!");
1759 if (!GetElementPtrInst::getIndexedType(*$2, *$4, true))
1760 ThrowException("Can't get element ptr '" + (*$2)->getDescription()+ "'!");
1761 $$ = new GetElementPtrInst(getVal(*$2, $3), *$4);
1762 delete $2; delete $4;
1766 int yyerror(const char *ErrorMsg) {
1768 = std::string((CurFilename == "-") ? std::string("<stdin>") : CurFilename)
1769 + ":" + utostr((unsigned) llvmAsmlineno) + ": ";
1770 std::string errMsg = std::string(ErrorMsg) + "\n" + where + " while reading ";
1771 if (yychar == YYEMPTY)
1772 errMsg += "end-of-file.";
1774 errMsg += "token: '" + std::string(llvmAsmtext, llvmAsmleng) + "'";
1775 ThrowException(errMsg);