1 //===- TGParser.cpp - Parser for TableGen Files ---------------------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // Implement the Parser for TableGen.
12 //===----------------------------------------------------------------------===//
18 #include "llvm/ADT/StringExtras.h"
21 //===----------------------------------------------------------------------===//
22 // Support Code for the Semantic Actions.
23 //===----------------------------------------------------------------------===//
27 Record Rec; // Placeholder for template args and Name.
28 std::vector<Record*> DefPrototypes;
30 MultiClass(const std::string &Name, TGLoc Loc) : Rec(Name, Loc) {}
33 struct SubClassReference {
36 std::vector<Init*> TemplateArgs;
37 SubClassReference() : Rec(0) {}
39 bool isInvalid() const { return Rec == 0; }
42 } // end namespace llvm
44 bool TGParser::AddValue(Record *CurRec, TGLoc Loc, const RecordVal &RV) {
46 CurRec = &CurMultiClass->Rec;
48 if (RecordVal *ERV = CurRec->getValue(RV.getName())) {
49 // The value already exists in the class, treat this as a set.
50 if (ERV->setValue(RV.getValue()))
51 return Error(Loc, "New definition of '" + RV.getName() + "' of type '" +
52 RV.getType()->getAsString() + "' is incompatible with " +
53 "previous definition of type '" +
54 ERV->getType()->getAsString() + "'");
62 /// Return true on error, false on success.
63 bool TGParser::SetValue(Record *CurRec, TGLoc Loc, const std::string &ValName,
64 const std::vector<unsigned> &BitList, Init *V) {
67 if (CurRec == 0) CurRec = &CurMultiClass->Rec;
69 RecordVal *RV = CurRec->getValue(ValName);
71 return Error(Loc, "Value '" + ValName + "' unknown!");
73 // Do not allow assignments like 'X = X'. This will just cause infinite loops
74 // in the resolution machinery.
76 if (VarInit *VI = dynamic_cast<VarInit*>(V))
77 if (VI->getName() == ValName)
80 // If we are assigning to a subset of the bits in the value... then we must be
81 // assigning to a field of BitsRecTy, which must have a BitsInit
84 if (!BitList.empty()) {
85 BitsInit *CurVal = dynamic_cast<BitsInit*>(RV->getValue());
87 return Error(Loc, "Value '" + ValName + "' is not a bits type");
89 // Convert the incoming value to a bits type of the appropriate size...
90 Init *BI = V->convertInitializerTo(new BitsRecTy(BitList.size()));
92 V->convertInitializerTo(new BitsRecTy(BitList.size()));
93 return Error(Loc, "Initializer is not compatible with bit range");
96 // We should have a BitsInit type now.
97 BitsInit *BInit = dynamic_cast<BitsInit*>(BI);
100 BitsInit *NewVal = new BitsInit(CurVal->getNumBits());
102 // Loop over bits, assigning values as appropriate.
103 for (unsigned i = 0, e = BitList.size(); i != e; ++i) {
104 unsigned Bit = BitList[i];
105 if (NewVal->getBit(Bit))
106 return Error(Loc, "Cannot set bit #" + utostr(Bit) + " of value '" +
107 ValName + "' more than once");
108 NewVal->setBit(Bit, BInit->getBit(i));
111 for (unsigned i = 0, e = CurVal->getNumBits(); i != e; ++i)
112 if (NewVal->getBit(i) == 0)
113 NewVal->setBit(i, CurVal->getBit(i));
119 return Error(Loc, "Value '" + ValName + "' of type '" +
120 RV->getType()->getAsString() +
121 "' is incompatible with initializer '" + V->getAsString() +"'");
125 /// AddSubClass - Add SubClass as a subclass to CurRec, resolving its template
126 /// args as SubClass's template arguments.
127 bool TGParser::AddSubClass(Record *CurRec, SubClassReference &SubClass) {
128 Record *SC = SubClass.Rec;
129 // Add all of the values in the subclass into the current class.
130 const std::vector<RecordVal> &Vals = SC->getValues();
131 for (unsigned i = 0, e = Vals.size(); i != e; ++i)
132 if (AddValue(CurRec, SubClass.RefLoc, Vals[i]))
135 const std::vector<std::string> &TArgs = SC->getTemplateArgs();
137 // Ensure that an appropriate number of template arguments are specified.
138 if (TArgs.size() < SubClass.TemplateArgs.size())
139 return Error(SubClass.RefLoc, "More template args specified than expected");
141 // Loop over all of the template arguments, setting them to the specified
142 // value or leaving them as the default if necessary.
143 for (unsigned i = 0, e = TArgs.size(); i != e; ++i) {
144 if (i < SubClass.TemplateArgs.size()) {
145 // If a value is specified for this template arg, set it now.
146 if (SetValue(CurRec, SubClass.RefLoc, TArgs[i], std::vector<unsigned>(),
147 SubClass.TemplateArgs[i]))
151 CurRec->resolveReferencesTo(CurRec->getValue(TArgs[i]));
154 CurRec->removeValue(TArgs[i]);
156 } else if (!CurRec->getValue(TArgs[i])->getValue()->isComplete()) {
157 return Error(SubClass.RefLoc,"Value not specified for template argument #"
158 + utostr(i) + " (" + TArgs[i] + ") of subclass '" +
159 SC->getName() + "'!");
163 // Since everything went well, we can now set the "superclass" list for the
165 const std::vector<Record*> &SCs = SC->getSuperClasses();
166 for (unsigned i = 0, e = SCs.size(); i != e; ++i) {
167 if (CurRec->isSubClassOf(SCs[i]))
168 return Error(SubClass.RefLoc,
169 "Already subclass of '" + SCs[i]->getName() + "'!\n");
170 CurRec->addSuperClass(SCs[i]);
173 if (CurRec->isSubClassOf(SC))
174 return Error(SubClass.RefLoc,
175 "Already subclass of '" + SC->getName() + "'!\n");
176 CurRec->addSuperClass(SC);
180 //===----------------------------------------------------------------------===//
182 //===----------------------------------------------------------------------===//
184 /// isObjectStart - Return true if this is a valid first token for an Object.
185 static bool isObjectStart(tgtok::TokKind K) {
186 return K == tgtok::Class || K == tgtok::Def ||
187 K == tgtok::Defm || K == tgtok::Let || K == tgtok::MultiClass;
190 /// ParseObjectName - If an object name is specified, return it. Otherwise,
191 /// return an anonymous name.
192 /// ObjectName ::= ID
193 /// ObjectName ::= /*empty*/
195 std::string TGParser::ParseObjectName() {
196 if (Lex.getCode() == tgtok::Id) {
197 std::string Ret = Lex.getCurStrVal();
202 static unsigned AnonCounter = 0;
203 return "anonymous."+utostr(AnonCounter++);
207 /// ParseClassID - Parse and resolve a reference to a class name. This returns
212 Record *TGParser::ParseClassID() {
213 if (Lex.getCode() != tgtok::Id) {
214 TokError("expected name for ClassID");
218 Record *Result = Records.getClass(Lex.getCurStrVal());
220 TokError("Couldn't find class '" + Lex.getCurStrVal() + "'");
226 Record *TGParser::ParseDefmID() {
227 if (Lex.getCode() != tgtok::Id) {
228 TokError("expected multiclass name");
232 MultiClass *MC = MultiClasses[Lex.getCurStrVal()];
234 TokError("Couldn't find multiclass '" + Lex.getCurStrVal() + "'");
244 /// ParseSubClassReference - Parse a reference to a subclass or to a templated
245 /// subclass. This returns a SubClassReference with a null Record* on error.
247 /// SubClassRef ::= ClassID
248 /// SubClassRef ::= ClassID '<' ValueList '>'
250 SubClassReference TGParser::
251 ParseSubClassReference(Record *CurRec, bool isDefm) {
252 SubClassReference Result;
253 Result.RefLoc = Lex.getLoc();
256 Result.Rec = ParseDefmID();
258 Result.Rec = ParseClassID();
259 if (Result.Rec == 0) return Result;
261 // If there is no template arg list, we're done.
262 if (Lex.getCode() != tgtok::less)
264 Lex.Lex(); // Eat the '<'
266 if (Lex.getCode() == tgtok::greater) {
267 TokError("subclass reference requires a non-empty list of template values");
272 Result.TemplateArgs = ParseValueList(CurRec);
273 if (Result.TemplateArgs.empty()) {
274 Result.Rec = 0; // Error parsing value list.
278 if (Lex.getCode() != tgtok::greater) {
279 TokError("expected '>' in template value list");
288 /// ParseRangePiece - Parse a bit/value range.
289 /// RangePiece ::= INTVAL
290 /// RangePiece ::= INTVAL '-' INTVAL
291 /// RangePiece ::= INTVAL INTVAL
292 bool TGParser::ParseRangePiece(std::vector<unsigned> &Ranges) {
293 if (Lex.getCode() != tgtok::IntVal) {
294 TokError("expected integer or bitrange");
297 int64_t Start = Lex.getCurIntVal();
301 return TokError("invalid range, cannot be negative");
303 switch (Lex.Lex()) { // eat first character.
305 Ranges.push_back(Start);
308 if (Lex.Lex() != tgtok::IntVal) {
309 TokError("expected integer value as end of range");
312 End = Lex.getCurIntVal();
315 End = -Lex.getCurIntVal();
319 return TokError("invalid range, cannot be negative");
324 for (; Start <= End; ++Start)
325 Ranges.push_back(Start);
327 for (; Start >= End; --Start)
328 Ranges.push_back(Start);
333 /// ParseRangeList - Parse a list of scalars and ranges into scalar values.
335 /// RangeList ::= RangePiece (',' RangePiece)*
337 std::vector<unsigned> TGParser::ParseRangeList() {
338 std::vector<unsigned> Result;
340 // Parse the first piece.
341 if (ParseRangePiece(Result))
342 return std::vector<unsigned>();
343 while (Lex.getCode() == tgtok::comma) {
344 Lex.Lex(); // Eat the comma.
346 // Parse the next range piece.
347 if (ParseRangePiece(Result))
348 return std::vector<unsigned>();
353 /// ParseOptionalRangeList - Parse either a range list in <>'s or nothing.
354 /// OptionalRangeList ::= '<' RangeList '>'
355 /// OptionalRangeList ::= /*empty*/
356 bool TGParser::ParseOptionalRangeList(std::vector<unsigned> &Ranges) {
357 if (Lex.getCode() != tgtok::less)
360 TGLoc StartLoc = Lex.getLoc();
361 Lex.Lex(); // eat the '<'
363 // Parse the range list.
364 Ranges = ParseRangeList();
365 if (Ranges.empty()) return true;
367 if (Lex.getCode() != tgtok::greater) {
368 TokError("expected '>' at end of range list");
369 return Error(StartLoc, "to match this '<'");
371 Lex.Lex(); // eat the '>'.
375 /// ParseOptionalBitList - Parse either a bit list in {}'s or nothing.
376 /// OptionalBitList ::= '{' RangeList '}'
377 /// OptionalBitList ::= /*empty*/
378 bool TGParser::ParseOptionalBitList(std::vector<unsigned> &Ranges) {
379 if (Lex.getCode() != tgtok::l_brace)
382 TGLoc StartLoc = Lex.getLoc();
383 Lex.Lex(); // eat the '{'
385 // Parse the range list.
386 Ranges = ParseRangeList();
387 if (Ranges.empty()) return true;
389 if (Lex.getCode() != tgtok::r_brace) {
390 TokError("expected '}' at end of bit list");
391 return Error(StartLoc, "to match this '{'");
393 Lex.Lex(); // eat the '}'.
398 /// ParseType - Parse and return a tblgen type. This returns null on error.
400 /// Type ::= STRING // string type
401 /// Type ::= BIT // bit type
402 /// Type ::= BITS '<' INTVAL '>' // bits<x> type
403 /// Type ::= INT // int type
404 /// Type ::= LIST '<' Type '>' // list<x> type
405 /// Type ::= CODE // code type
406 /// Type ::= DAG // dag type
407 /// Type ::= ClassID // Record Type
409 RecTy *TGParser::ParseType() {
410 switch (Lex.getCode()) {
411 default: TokError("Unknown token when expecting a type"); return 0;
412 case tgtok::String: Lex.Lex(); return new StringRecTy();
413 case tgtok::Bit: Lex.Lex(); return new BitRecTy();
414 case tgtok::Int: Lex.Lex(); return new IntRecTy();
415 case tgtok::Code: Lex.Lex(); return new CodeRecTy();
416 case tgtok::Dag: Lex.Lex(); return new DagRecTy();
418 if (Record *R = ParseClassID()) return new RecordRecTy(R);
421 if (Lex.Lex() != tgtok::less) { // Eat 'bits'
422 TokError("expected '<' after bits type");
425 if (Lex.Lex() != tgtok::IntVal) { // Eat '<'
426 TokError("expected integer in bits<n> type");
429 uint64_t Val = Lex.getCurIntVal();
430 if (Lex.Lex() != tgtok::greater) { // Eat count.
431 TokError("expected '>' at end of bits<n> type");
434 Lex.Lex(); // Eat '>'
435 return new BitsRecTy(Val);
438 if (Lex.Lex() != tgtok::less) { // Eat 'bits'
439 TokError("expected '<' after list type");
442 Lex.Lex(); // Eat '<'
443 RecTy *SubType = ParseType();
444 if (SubType == 0) return 0;
446 if (Lex.getCode() != tgtok::greater) {
447 TokError("expected '>' at end of list<ty> type");
450 Lex.Lex(); // Eat '>'
451 return new ListRecTy(SubType);
456 /// ParseIDValue - Parse an ID as a value and decode what it means.
458 /// IDValue ::= ID [def local value]
459 /// IDValue ::= ID [def template arg]
460 /// IDValue ::= ID [multiclass local value]
461 /// IDValue ::= ID [multiclass template argument]
462 /// IDValue ::= ID [def name]
464 Init *TGParser::ParseIDValue(Record *CurRec) {
465 assert(Lex.getCode() == tgtok::Id && "Expected ID in ParseIDValue");
466 std::string Name = Lex.getCurStrVal();
467 TGLoc Loc = Lex.getLoc();
469 return ParseIDValue(CurRec, Name, Loc);
472 /// ParseIDValue - This is just like ParseIDValue above, but it assumes the ID
473 /// has already been read.
474 Init *TGParser::ParseIDValue(Record *CurRec,
475 const std::string &Name, TGLoc NameLoc) {
477 if (const RecordVal *RV = CurRec->getValue(Name))
478 return new VarInit(Name, RV->getType());
480 std::string TemplateArgName = CurRec->getName()+":"+Name;
481 if (CurRec->isTemplateArg(TemplateArgName)) {
482 const RecordVal *RV = CurRec->getValue(TemplateArgName);
483 assert(RV && "Template arg doesn't exist??");
484 return new VarInit(TemplateArgName, RV->getType());
489 std::string MCName = CurMultiClass->Rec.getName()+"::"+Name;
490 if (CurMultiClass->Rec.isTemplateArg(MCName)) {
491 const RecordVal *RV = CurMultiClass->Rec.getValue(MCName);
492 assert(RV && "Template arg doesn't exist??");
493 return new VarInit(MCName, RV->getType());
497 if (Record *D = Records.getDef(Name))
498 return new DefInit(D);
500 Error(NameLoc, "Variable not defined: '" + Name + "'");
504 /// ParseSimpleValue - Parse a tblgen value. This returns null on error.
506 /// SimpleValue ::= IDValue
507 /// SimpleValue ::= INTVAL
508 /// SimpleValue ::= STRVAL+
509 /// SimpleValue ::= CODEFRAGMENT
510 /// SimpleValue ::= '?'
511 /// SimpleValue ::= '{' ValueList '}'
512 /// SimpleValue ::= ID '<' ValueListNE '>'
513 /// SimpleValue ::= '[' ValueList ']'
514 /// SimpleValue ::= '(' IDValue DagArgList ')'
515 /// SimpleValue ::= CONCATTOK '(' Value ',' Value ')'
516 /// SimpleValue ::= SHLTOK '(' Value ',' Value ')'
517 /// SimpleValue ::= SRATOK '(' Value ',' Value ')'
518 /// SimpleValue ::= SRLTOK '(' Value ',' Value ')'
519 /// SimpleValue ::= STRCONCATTOK '(' Value ',' Value ')'
521 Init *TGParser::ParseSimpleValue(Record *CurRec) {
523 switch (Lex.getCode()) {
524 default: TokError("Unknown token when parsing a value"); break;
525 case tgtok::IntVal: R = new IntInit(Lex.getCurIntVal()); Lex.Lex(); break;
526 case tgtok::StrVal: {
527 std::string Val = Lex.getCurStrVal();
530 // Handle multiple consecutive concatenated strings.
531 while (Lex.getCode() == tgtok::StrVal) {
532 Val += Lex.getCurStrVal();
536 R = new StringInit(Val);
539 case tgtok::CodeFragment:
540 R = new CodeInit(Lex.getCurStrVal()); Lex.Lex(); break;
541 case tgtok::question: R = new UnsetInit(); Lex.Lex(); break;
543 TGLoc NameLoc = Lex.getLoc();
544 std::string Name = Lex.getCurStrVal();
545 if (Lex.Lex() != tgtok::less) // consume the Id.
546 return ParseIDValue(CurRec, Name, NameLoc); // Value ::= IDValue
548 // Value ::= ID '<' ValueListNE '>'
549 if (Lex.Lex() == tgtok::greater) {
550 TokError("expected non-empty value list");
553 std::vector<Init*> ValueList = ParseValueList(CurRec);
554 if (ValueList.empty()) return 0;
556 if (Lex.getCode() != tgtok::greater) {
557 TokError("expected '>' at end of value list");
560 Lex.Lex(); // eat the '>'
562 // This is a CLASS<initvalslist> expression. This is supposed to synthesize
563 // a new anonymous definition, deriving from CLASS<initvalslist> with no
565 Record *Class = Records.getClass(Name);
567 Error(NameLoc, "Expected a class name, got '" + Name + "'");
571 // Create the new record, set it as CurRec temporarily.
572 static unsigned AnonCounter = 0;
573 Record *NewRec = new Record("anonymous.val."+utostr(AnonCounter++),NameLoc);
574 SubClassReference SCRef;
575 SCRef.RefLoc = NameLoc;
577 SCRef.TemplateArgs = ValueList;
578 // Add info about the subclass to NewRec.
579 if (AddSubClass(NewRec, SCRef))
581 NewRec->resolveReferences();
582 Records.addDef(NewRec);
584 // The result of the expression is a reference to the new record.
585 return new DefInit(NewRec);
587 case tgtok::l_brace: { // Value ::= '{' ValueList '}'
588 TGLoc BraceLoc = Lex.getLoc();
589 Lex.Lex(); // eat the '{'
590 std::vector<Init*> Vals;
592 if (Lex.getCode() != tgtok::r_brace) {
593 Vals = ParseValueList(CurRec);
594 if (Vals.empty()) return 0;
596 if (Lex.getCode() != tgtok::r_brace) {
597 TokError("expected '}' at end of bit list value");
600 Lex.Lex(); // eat the '}'
602 BitsInit *Result = new BitsInit(Vals.size());
603 for (unsigned i = 0, e = Vals.size(); i != e; ++i) {
604 Init *Bit = Vals[i]->convertInitializerTo(new BitRecTy());
606 Error(BraceLoc, "Element #" + utostr(i) + " (" + Vals[i]->getAsString()+
607 ") is not convertable to a bit");
610 Result->setBit(Vals.size()-i-1, Bit);
614 case tgtok::l_square: { // Value ::= '[' ValueList ']'
615 Lex.Lex(); // eat the '['
616 std::vector<Init*> Vals;
618 if (Lex.getCode() != tgtok::r_square) {
619 Vals = ParseValueList(CurRec);
620 if (Vals.empty()) return 0;
622 if (Lex.getCode() != tgtok::r_square) {
623 TokError("expected ']' at end of list value");
626 Lex.Lex(); // eat the ']'
627 return new ListInit(Vals);
629 case tgtok::l_paren: { // Value ::= '(' IDValue DagArgList ')'
630 Lex.Lex(); // eat the '('
631 if (Lex.getCode() != tgtok::Id) {
632 TokError("expected identifier in dag init");
636 Init *Operator = ParseIDValue(CurRec);
637 if (Operator == 0) return 0;
639 // If the operator name is present, parse it.
640 std::string OperatorName;
641 if (Lex.getCode() == tgtok::colon) {
642 if (Lex.Lex() != tgtok::VarName) { // eat the ':'
643 TokError("expected variable name in dag operator");
646 OperatorName = Lex.getCurStrVal();
647 Lex.Lex(); // eat the VarName.
651 std::vector<std::pair<llvm::Init*, std::string> > DagArgs;
652 if (Lex.getCode() != tgtok::r_paren) {
653 DagArgs = ParseDagArgList(CurRec);
654 if (DagArgs.empty()) return 0;
657 if (Lex.getCode() != tgtok::r_paren) {
658 TokError("expected ')' in dag init");
661 Lex.Lex(); // eat the ')'
663 return new DagInit(Operator, OperatorName, DagArgs);
669 case tgtok::XStrConcat: { // Value ::= !binop '(' Value ',' Value ')'
670 BinOpInit::BinaryOp Code;
671 switch (Lex.getCode()) {
672 default: assert(0 && "Unhandled code!");
673 case tgtok::XConcat: Code = BinOpInit::CONCAT; break;
674 case tgtok::XSRA: Code = BinOpInit::SRA; break;
675 case tgtok::XSRL: Code = BinOpInit::SRL; break;
676 case tgtok::XSHL: Code = BinOpInit::SHL; break;
677 case tgtok::XStrConcat: Code = BinOpInit::STRCONCAT; break;
679 Lex.Lex(); // eat the operation
680 if (Lex.getCode() != tgtok::l_paren) {
681 TokError("expected '(' after binary operator");
684 Lex.Lex(); // eat the '('
686 Init *LHS = ParseValue(CurRec);
687 if (LHS == 0) return 0;
689 if (Lex.getCode() != tgtok::comma) {
690 TokError("expected ',' in binary operator");
693 Lex.Lex(); // eat the ','
695 Init *RHS = ParseValue(CurRec);
696 if (RHS == 0) return 0;
698 if (Lex.getCode() != tgtok::r_paren) {
699 TokError("expected ')' in binary operator");
702 Lex.Lex(); // eat the ')'
703 return (new BinOpInit(Code, LHS, RHS))->Fold();
710 /// ParseValue - Parse a tblgen value. This returns null on error.
712 /// Value ::= SimpleValue ValueSuffix*
713 /// ValueSuffix ::= '{' RangeList '}'
714 /// ValueSuffix ::= '[' RangeList ']'
715 /// ValueSuffix ::= '.' ID
717 Init *TGParser::ParseValue(Record *CurRec) {
718 Init *Result = ParseSimpleValue(CurRec);
719 if (Result == 0) return 0;
721 // Parse the suffixes now if present.
723 switch (Lex.getCode()) {
724 default: return Result;
725 case tgtok::l_brace: {
726 TGLoc CurlyLoc = Lex.getLoc();
727 Lex.Lex(); // eat the '{'
728 std::vector<unsigned> Ranges = ParseRangeList();
729 if (Ranges.empty()) return 0;
731 // Reverse the bitlist.
732 std::reverse(Ranges.begin(), Ranges.end());
733 Result = Result->convertInitializerBitRange(Ranges);
735 Error(CurlyLoc, "Invalid bit range for value");
740 if (Lex.getCode() != tgtok::r_brace) {
741 TokError("expected '}' at end of bit range list");
747 case tgtok::l_square: {
748 TGLoc SquareLoc = Lex.getLoc();
749 Lex.Lex(); // eat the '['
750 std::vector<unsigned> Ranges = ParseRangeList();
751 if (Ranges.empty()) return 0;
753 Result = Result->convertInitListSlice(Ranges);
755 Error(SquareLoc, "Invalid range for list slice");
760 if (Lex.getCode() != tgtok::r_square) {
761 TokError("expected ']' at end of list slice");
768 if (Lex.Lex() != tgtok::Id) { // eat the .
769 TokError("expected field identifier after '.'");
772 if (!Result->getFieldType(Lex.getCurStrVal())) {
773 TokError("Cannot access field '" + Lex.getCurStrVal() + "' of value '" +
774 Result->getAsString() + "'");
777 Result = new FieldInit(Result, Lex.getCurStrVal());
778 Lex.Lex(); // eat field name
784 /// ParseDagArgList - Parse the argument list for a dag literal expression.
786 /// ParseDagArgList ::= Value (':' VARNAME)?
787 /// ParseDagArgList ::= ParseDagArgList ',' Value (':' VARNAME)?
788 std::vector<std::pair<llvm::Init*, std::string> >
789 TGParser::ParseDagArgList(Record *CurRec) {
790 std::vector<std::pair<llvm::Init*, std::string> > Result;
793 Init *Val = ParseValue(CurRec);
794 if (Val == 0) return std::vector<std::pair<llvm::Init*, std::string> >();
796 // If the variable name is present, add it.
798 if (Lex.getCode() == tgtok::colon) {
799 if (Lex.Lex() != tgtok::VarName) { // eat the ':'
800 TokError("expected variable name in dag literal");
801 return std::vector<std::pair<llvm::Init*, std::string> >();
803 VarName = Lex.getCurStrVal();
804 Lex.Lex(); // eat the VarName.
807 Result.push_back(std::make_pair(Val, VarName));
809 if (Lex.getCode() != tgtok::comma) break;
810 Lex.Lex(); // eat the ','
817 /// ParseValueList - Parse a comma separated list of values, returning them as a
818 /// vector. Note that this always expects to be able to parse at least one
819 /// value. It returns an empty list if this is not possible.
821 /// ValueList ::= Value (',' Value)*
823 std::vector<Init*> TGParser::ParseValueList(Record *CurRec) {
824 std::vector<Init*> Result;
825 Result.push_back(ParseValue(CurRec));
826 if (Result.back() == 0) return std::vector<Init*>();
828 while (Lex.getCode() == tgtok::comma) {
829 Lex.Lex(); // Eat the comma
831 Result.push_back(ParseValue(CurRec));
832 if (Result.back() == 0) return std::vector<Init*>();
840 /// ParseDeclaration - Read a declaration, returning the name of field ID, or an
841 /// empty string on error. This can happen in a number of different contexts,
842 /// including within a def or in the template args for a def (in which case
843 /// CurRec will be non-null) and within the template args for a multiclass (in
844 /// which case CurRec will be null, but CurMultiClass will be set). This can
845 /// also happen within a def that is within a multiclass, which will set both
846 /// CurRec and CurMultiClass.
848 /// Declaration ::= FIELD? Type ID ('=' Value)?
850 std::string TGParser::ParseDeclaration(Record *CurRec,
851 bool ParsingTemplateArgs) {
852 // Read the field prefix if present.
853 bool HasField = Lex.getCode() == tgtok::Field;
854 if (HasField) Lex.Lex();
856 RecTy *Type = ParseType();
857 if (Type == 0) return "";
859 if (Lex.getCode() != tgtok::Id) {
860 TokError("Expected identifier in declaration");
864 TGLoc IdLoc = Lex.getLoc();
865 std::string DeclName = Lex.getCurStrVal();
868 if (ParsingTemplateArgs) {
870 DeclName = CurRec->getName() + ":" + DeclName;
872 assert(CurMultiClass);
875 DeclName = CurMultiClass->Rec.getName() + "::" + DeclName;
879 if (AddValue(CurRec, IdLoc, RecordVal(DeclName, Type, HasField)))
882 // If a value is present, parse it.
883 if (Lex.getCode() == tgtok::equal) {
885 TGLoc ValLoc = Lex.getLoc();
886 Init *Val = ParseValue(CurRec);
888 SetValue(CurRec, ValLoc, DeclName, std::vector<unsigned>(), Val))
895 /// ParseTemplateArgList - Read a template argument list, which is a non-empty
896 /// sequence of template-declarations in <>'s. If CurRec is non-null, these are
897 /// template args for a def, which may or may not be in a multiclass. If null,
898 /// these are the template args for a multiclass.
900 /// TemplateArgList ::= '<' Declaration (',' Declaration)* '>'
902 bool TGParser::ParseTemplateArgList(Record *CurRec) {
903 assert(Lex.getCode() == tgtok::less && "Not a template arg list!");
904 Lex.Lex(); // eat the '<'
906 Record *TheRecToAddTo = CurRec ? CurRec : &CurMultiClass->Rec;
908 // Read the first declaration.
909 std::string TemplArg = ParseDeclaration(CurRec, true/*templateargs*/);
910 if (TemplArg.empty())
913 TheRecToAddTo->addTemplateArg(TemplArg);
915 while (Lex.getCode() == tgtok::comma) {
916 Lex.Lex(); // eat the ','
918 // Read the following declarations.
919 TemplArg = ParseDeclaration(CurRec, true/*templateargs*/);
920 if (TemplArg.empty())
922 TheRecToAddTo->addTemplateArg(TemplArg);
925 if (Lex.getCode() != tgtok::greater)
926 return TokError("expected '>' at end of template argument list");
927 Lex.Lex(); // eat the '>'.
932 /// ParseBodyItem - Parse a single item within the body of a def or class.
934 /// BodyItem ::= Declaration ';'
935 /// BodyItem ::= LET ID OptionalBitList '=' Value ';'
936 bool TGParser::ParseBodyItem(Record *CurRec) {
937 if (Lex.getCode() != tgtok::Let) {
938 if (ParseDeclaration(CurRec, false).empty())
941 if (Lex.getCode() != tgtok::semi)
942 return TokError("expected ';' after declaration");
947 // LET ID OptionalBitList '=' Value ';'
948 if (Lex.Lex() != tgtok::Id)
949 return TokError("expected field identifier after let");
951 TGLoc IdLoc = Lex.getLoc();
952 std::string FieldName = Lex.getCurStrVal();
953 Lex.Lex(); // eat the field name.
955 std::vector<unsigned> BitList;
956 if (ParseOptionalBitList(BitList))
958 std::reverse(BitList.begin(), BitList.end());
960 if (Lex.getCode() != tgtok::equal)
961 return TokError("expected '=' in let expression");
962 Lex.Lex(); // eat the '='.
964 Init *Val = ParseValue(CurRec);
965 if (Val == 0) return true;
967 if (Lex.getCode() != tgtok::semi)
968 return TokError("expected ';' after let expression");
971 return SetValue(CurRec, IdLoc, FieldName, BitList, Val);
974 /// ParseBody - Read the body of a class or def. Return true on error, false on
978 /// Body ::= '{' BodyList '}'
979 /// BodyList ::= BodyItem*
981 bool TGParser::ParseBody(Record *CurRec) {
982 // If this is a null definition, just eat the semi and return.
983 if (Lex.getCode() == tgtok::semi) {
988 if (Lex.getCode() != tgtok::l_brace)
989 return TokError("Expected ';' or '{' to start body");
993 while (Lex.getCode() != tgtok::r_brace)
994 if (ParseBodyItem(CurRec))
1002 /// ParseObjectBody - Parse the body of a def or class. This consists of an
1003 /// optional BaseClassList followed by a Body. CurRec is the current def or class
1004 /// that is being parsed.
1006 /// ObjectBody ::= BaseClassList Body
1007 /// BaseClassList ::= /*empty*/
1008 /// BaseClassList ::= ':' BaseClassListNE
1009 /// BaseClassListNE ::= SubClassRef (',' SubClassRef)*
1011 bool TGParser::ParseObjectBody(Record *CurRec) {
1012 // If there is a baseclass list, read it.
1013 if (Lex.getCode() == tgtok::colon) {
1016 // Read all of the subclasses.
1017 SubClassReference SubClass = ParseSubClassReference(CurRec, false);
1020 if (SubClass.Rec == 0) return true;
1023 if (AddSubClass(CurRec, SubClass))
1026 if (Lex.getCode() != tgtok::comma) break;
1027 Lex.Lex(); // eat ','.
1028 SubClass = ParseSubClassReference(CurRec, false);
1032 // Process any variables on the let stack.
1033 for (unsigned i = 0, e = LetStack.size(); i != e; ++i)
1034 for (unsigned j = 0, e = LetStack[i].size(); j != e; ++j)
1035 if (SetValue(CurRec, LetStack[i][j].Loc, LetStack[i][j].Name,
1036 LetStack[i][j].Bits, LetStack[i][j].Value))
1039 return ParseBody(CurRec);
1043 /// ParseDef - Parse and return a top level or multiclass def, return the record
1044 /// corresponding to it. This returns null on error.
1046 /// DefInst ::= DEF ObjectName ObjectBody
1048 llvm::Record *TGParser::ParseDef(MultiClass *CurMultiClass) {
1049 TGLoc DefLoc = Lex.getLoc();
1050 assert(Lex.getCode() == tgtok::Def && "Unknown tok");
1051 Lex.Lex(); // Eat the 'def' token.
1053 // Parse ObjectName and make a record for it.
1054 Record *CurRec = new Record(ParseObjectName(), DefLoc);
1056 if (!CurMultiClass) {
1057 // Top-level def definition.
1059 // Ensure redefinition doesn't happen.
1060 if (Records.getDef(CurRec->getName())) {
1061 Error(DefLoc, "def '" + CurRec->getName() + "' already defined");
1064 Records.addDef(CurRec);
1066 // Otherwise, a def inside a multiclass, add it to the multiclass.
1067 for (unsigned i = 0, e = CurMultiClass->DefPrototypes.size(); i != e; ++i)
1068 if (CurMultiClass->DefPrototypes[i]->getName() == CurRec->getName()) {
1069 Error(DefLoc, "def '" + CurRec->getName() +
1070 "' already defined in this multiclass!");
1073 CurMultiClass->DefPrototypes.push_back(CurRec);
1076 if (ParseObjectBody(CurRec))
1079 if (CurMultiClass == 0) // Def's in multiclasses aren't really defs.
1080 CurRec->resolveReferences();
1082 // If ObjectBody has template arguments, it's an error.
1083 assert(CurRec->getTemplateArgs().empty() && "How'd this get template args?");
1088 /// ParseClass - Parse a tblgen class definition.
1090 /// ClassInst ::= CLASS ID TemplateArgList? ObjectBody
1092 bool TGParser::ParseClass() {
1093 assert(Lex.getCode() == tgtok::Class && "Unexpected token!");
1096 if (Lex.getCode() != tgtok::Id)
1097 return TokError("expected class name after 'class' keyword");
1099 Record *CurRec = Records.getClass(Lex.getCurStrVal());
1101 // If the body was previously defined, this is an error.
1102 if (!CurRec->getValues().empty() ||
1103 !CurRec->getSuperClasses().empty() ||
1104 !CurRec->getTemplateArgs().empty())
1105 return TokError("Class '" + CurRec->getName() + "' already defined");
1107 // If this is the first reference to this class, create and add it.
1108 CurRec = new Record(Lex.getCurStrVal(), Lex.getLoc());
1109 Records.addClass(CurRec);
1111 Lex.Lex(); // eat the name.
1113 // If there are template args, parse them.
1114 if (Lex.getCode() == tgtok::less)
1115 if (ParseTemplateArgList(CurRec))
1118 // Finally, parse the object body.
1119 return ParseObjectBody(CurRec);
1122 /// ParseLetList - Parse a non-empty list of assignment expressions into a list
1125 /// LetList ::= LetItem (',' LetItem)*
1126 /// LetItem ::= ID OptionalRangeList '=' Value
1128 std::vector<LetRecord> TGParser::ParseLetList() {
1129 std::vector<LetRecord> Result;
1132 if (Lex.getCode() != tgtok::Id) {
1133 TokError("expected identifier in let definition");
1134 return std::vector<LetRecord>();
1136 std::string Name = Lex.getCurStrVal();
1137 TGLoc NameLoc = Lex.getLoc();
1138 Lex.Lex(); // Eat the identifier.
1140 // Check for an optional RangeList.
1141 std::vector<unsigned> Bits;
1142 if (ParseOptionalRangeList(Bits))
1143 return std::vector<LetRecord>();
1144 std::reverse(Bits.begin(), Bits.end());
1146 if (Lex.getCode() != tgtok::equal) {
1147 TokError("expected '=' in let expression");
1148 return std::vector<LetRecord>();
1150 Lex.Lex(); // eat the '='.
1152 Init *Val = ParseValue(0);
1153 if (Val == 0) return std::vector<LetRecord>();
1155 // Now that we have everything, add the record.
1156 Result.push_back(LetRecord(Name, Bits, Val, NameLoc));
1158 if (Lex.getCode() != tgtok::comma)
1160 Lex.Lex(); // eat the comma.
1164 /// ParseTopLevelLet - Parse a 'let' at top level. This can be a couple of
1165 /// different related productions.
1167 /// Object ::= LET LetList IN '{' ObjectList '}'
1168 /// Object ::= LET LetList IN Object
1170 bool TGParser::ParseTopLevelLet() {
1171 assert(Lex.getCode() == tgtok::Let && "Unexpected token");
1174 // Add this entry to the let stack.
1175 std::vector<LetRecord> LetInfo = ParseLetList();
1176 if (LetInfo.empty()) return true;
1177 LetStack.push_back(LetInfo);
1179 if (Lex.getCode() != tgtok::In)
1180 return TokError("expected 'in' at end of top-level 'let'");
1183 // If this is a scalar let, just handle it now
1184 if (Lex.getCode() != tgtok::l_brace) {
1185 // LET LetList IN Object
1188 } else { // Object ::= LETCommand '{' ObjectList '}'
1189 TGLoc BraceLoc = Lex.getLoc();
1190 // Otherwise, this is a group let.
1191 Lex.Lex(); // eat the '{'.
1193 // Parse the object list.
1194 if (ParseObjectList())
1197 if (Lex.getCode() != tgtok::r_brace) {
1198 TokError("expected '}' at end of top level let command");
1199 return Error(BraceLoc, "to match this '{'");
1204 // Outside this let scope, this let block is not active.
1205 LetStack.pop_back();
1209 /// ParseMultiClassDef - Parse a def in a multiclass context.
1211 /// MultiClassDef ::= DefInst
1213 bool TGParser::ParseMultiClassDef(MultiClass *CurMC) {
1214 if (Lex.getCode() != tgtok::Def)
1215 return TokError("expected 'def' in multiclass body");
1217 Record *D = ParseDef(CurMC);
1218 if (D == 0) return true;
1220 // Copy the template arguments for the multiclass into the def.
1221 const std::vector<std::string> &TArgs = CurMC->Rec.getTemplateArgs();
1223 for (unsigned i = 0, e = TArgs.size(); i != e; ++i) {
1224 const RecordVal *RV = CurMC->Rec.getValue(TArgs[i]);
1225 assert(RV && "Template arg doesn't exist?");
1232 /// ParseMultiClass - Parse a multiclass definition.
1234 /// MultiClassInst ::= MULTICLASS ID TemplateArgList? '{' MultiClassDef+ '}'
1236 bool TGParser::ParseMultiClass() {
1237 assert(Lex.getCode() == tgtok::MultiClass && "Unexpected token");
1238 Lex.Lex(); // Eat the multiclass token.
1240 if (Lex.getCode() != tgtok::Id)
1241 return TokError("expected identifier after multiclass for name");
1242 std::string Name = Lex.getCurStrVal();
1244 if (MultiClasses.count(Name))
1245 return TokError("multiclass '" + Name + "' already defined");
1247 CurMultiClass = MultiClasses[Name] = new MultiClass(Name, Lex.getLoc());
1248 Lex.Lex(); // Eat the identifier.
1250 // If there are template args, parse them.
1251 if (Lex.getCode() == tgtok::less)
1252 if (ParseTemplateArgList(0))
1255 if (Lex.getCode() != tgtok::l_brace)
1256 return TokError("expected '{' in multiclass definition");
1258 if (Lex.Lex() == tgtok::r_brace) // eat the '{'.
1259 return TokError("multiclass must contain at least one def");
1261 while (Lex.getCode() != tgtok::r_brace)
1262 if (ParseMultiClassDef(CurMultiClass))
1265 Lex.Lex(); // eat the '}'.
1271 /// ParseDefm - Parse the instantiation of a multiclass.
1273 /// DefMInst ::= DEFM ID ':' DefmSubClassRef ';'
1275 bool TGParser::ParseDefm() {
1276 assert(Lex.getCode() == tgtok::Defm && "Unexpected token!");
1277 if (Lex.Lex() != tgtok::Id) // eat the defm.
1278 return TokError("expected identifier after defm");
1280 TGLoc DefmPrefixLoc = Lex.getLoc();
1281 std::string DefmPrefix = Lex.getCurStrVal();
1282 if (Lex.Lex() != tgtok::colon)
1283 return TokError("expected ':' after defm identifier");
1288 TGLoc SubClassLoc = Lex.getLoc();
1289 SubClassReference Ref = ParseSubClassReference(0, true);
1290 if (Ref.Rec == 0) return true;
1292 if (Lex.getCode() != tgtok::semi)
1293 return TokError("expected ';' at end of defm");
1296 // To instantiate a multiclass, we need to first get the multiclass, then
1297 // instantiate each def contained in the multiclass with the SubClassRef
1298 // template parameters.
1299 MultiClass *MC = MultiClasses[Ref.Rec->getName()];
1300 assert(MC && "Didn't lookup multiclass correctly?");
1301 std::vector<Init*> &TemplateVals = Ref.TemplateArgs;
1303 // Verify that the correct number of template arguments were specified.
1304 const std::vector<std::string> &TArgs = MC->Rec.getTemplateArgs();
1305 if (TArgs.size() < TemplateVals.size())
1306 return Error(SubClassLoc,
1307 "more template args specified than multiclass expects");
1309 // Loop over all the def's in the multiclass, instantiating each one.
1310 for (unsigned i = 0, e = MC->DefPrototypes.size(); i != e; ++i) {
1311 Record *DefProto = MC->DefPrototypes[i];
1313 // Add the suffix to the defm name to get the new name.
1314 Record *CurRec = new Record(DefmPrefix + DefProto->getName(),DefmPrefixLoc);
1316 SubClassReference Ref;
1317 Ref.RefLoc = DefmPrefixLoc;
1319 AddSubClass(CurRec, Ref);
1321 // Loop over all of the template arguments, setting them to the specified
1322 // value or leaving them as the default if necessary.
1323 for (unsigned i = 0, e = TArgs.size(); i != e; ++i) {
1324 if (i < TemplateVals.size()) { // A value is specified for this temp-arg?
1326 if (SetValue(CurRec, DefmPrefixLoc, TArgs[i], std::vector<unsigned>(),
1331 CurRec->resolveReferencesTo(CurRec->getValue(TArgs[i]));
1334 CurRec->removeValue(TArgs[i]);
1336 } else if (!CurRec->getValue(TArgs[i])->getValue()->isComplete()) {
1337 return Error(SubClassLoc, "value not specified for template argument #"+
1338 utostr(i) + " (" + TArgs[i] + ") of multiclassclass '" +
1339 MC->Rec.getName() + "'");
1343 // If the mdef is inside a 'let' expression, add to each def.
1344 for (unsigned i = 0, e = LetStack.size(); i != e; ++i)
1345 for (unsigned j = 0, e = LetStack[i].size(); j != e; ++j)
1346 if (SetValue(CurRec, LetStack[i][j].Loc, LetStack[i][j].Name,
1347 LetStack[i][j].Bits, LetStack[i][j].Value)) {
1348 Error(DefmPrefixLoc, "when instantiating this defm");
1353 // Ensure redefinition doesn't happen.
1354 if (Records.getDef(CurRec->getName()))
1355 return Error(DefmPrefixLoc, "def '" + CurRec->getName() +
1356 "' already defined, instantiating defm with subdef '" +
1357 DefProto->getName() + "'");
1358 Records.addDef(CurRec);
1359 CurRec->resolveReferences();
1366 /// Object ::= ClassInst
1367 /// Object ::= DefInst
1368 /// Object ::= MultiClassInst
1369 /// Object ::= DefMInst
1370 /// Object ::= LETCommand '{' ObjectList '}'
1371 /// Object ::= LETCommand Object
1372 bool TGParser::ParseObject() {
1373 switch (Lex.getCode()) {
1374 default: assert(0 && "This is not an object");
1375 case tgtok::Let: return ParseTopLevelLet();
1376 case tgtok::Def: return ParseDef(0) == 0;
1377 case tgtok::Defm: return ParseDefm();
1378 case tgtok::Class: return ParseClass();
1379 case tgtok::MultiClass: return ParseMultiClass();
1384 /// ObjectList :== Object*
1385 bool TGParser::ParseObjectList() {
1386 while (isObjectStart(Lex.getCode())) {
1394 bool TGParser::ParseFile() {
1395 Lex.Lex(); // Prime the lexer.
1396 if (ParseObjectList()) return true;
1398 // If we have unread input at the end of the file, report it.
1399 if (Lex.getCode() == tgtok::Eof)
1402 return TokError("Unexpected input at top level");