Add a !regmatch operator to do pattern matching in TableGen.

author David Greene <greened@obbligato.org>

Mon, 8 Jun 2009 17:00:34 +0000 (17:00 +0000)

committer David Greene <greened@obbligato.org>

Mon, 8 Jun 2009 17:00:34 +0000 (17:00 +0000)
author David Greene <greened@obbligato.org>
Mon, 8 Jun 2009 17:00:34 +0000 (17:00 +0000)
committer David Greene <greened@obbligato.org>
Mon, 8 Jun 2009 17:00:34 +0000 (17:00 +0000)
diff --git a/docs/TableGenFundamentals.html b/docs/TableGenFundamentals.html

index bd427116a163ce1b7cf3099af1e611fa390fe77b..2e74352010f4198ed03f503a0c7f5521170c4c8b 100644 (file)
--- a/docs/TableGenFundamentals.html
+++ b/docs/TableGenFundamentals.html
@@ -414,6 +414,9 @@ aborts with an error. </dd>
  <dt><tt>!subst(a, b, c)</tt></dt>
    <dd>If 'a' and 'b' are of string type or are symbol references, substitute 
  'b' for 'a' in 'c.'  This operation is analogous to $(subst) in GNU make.</dd>
+<dt><tt>!regmatch(a, b)</tt></dt>
+  <dd>An integer {0,1} indicating whether string 'b' matched regular expression
+'a.'</dd>
  <dt><tt>!foreach(a, b, c)</tt></dt>
    <dd>For each member 'b' of dag or list 'a' apply operator 'c.'  'b' is a 
  dummy variable that should be declared as a member variable of an instantiated 
diff --git a/test/TableGen/regmatch.td b/test/TableGen/regmatch.td

new file mode 100644 (file)

index 0000000..3eb35df
--- /dev/null
+++ b/test/TableGen/regmatch.td
@@ -0,0 +1,11 @@
+// RUN: tblgen %s | grep {Match1 = 1} | count 1
+// RUN: tblgen %s | grep {Match2 = 1} | count 1
+
+class Foo<string v> {
+      string Value = v;
+      int Match1 = !regmatch(".*ps$", v);
+      int Match2 = !regmatch(".*pd$", v);
+}
+
+def Bar : Foo<"addps">;
+def Baz : Foo<"addpd">;
diff --git a/utils/TableGen/Record.cpp b/utils/TableGen/Record.cpp

index 45804b938cb20ad6a886b946c60c18071d8ff168..47cab7b5db8b36e40d46f3b7f09332e4d438dfad 100644 (file)
--- a/utils/TableGen/Record.cpp
+++ b/utils/TableGen/Record.cpp
@@ -16,6 +16,8 @@
  #include "llvm/Support/Streams.h"
  #include "llvm/ADT/StringExtras.h"
  #include <ios>
+#include <sys/types.h>
+#include <regex.h>
  
  using namespace llvm;
  
@@ -671,6 +673,36 @@ Init *BinOpInit::Fold(Record *CurRec, MultiClass *CurMultiClass) {
      }
      break;
    }
+  case REGMATCH: {
+    StringInit *LHSs = dynamic_cast<StringInit*>(LHS);
+    StringInit *RHSs = dynamic_cast<StringInit*>(RHS);
+    if (LHSs && RHSs) {
+      regex_t compiled;
+      int err = regcomp (&compiled, LHSs->getValue().c_str(), REG_EXTENDED);
+      if (err != 0) {
+        size_t length = regerror (err, &compiled, NULL, 0);
+        char *buffer = new char[length];
+        (void) regerror (err, &compiled, buffer, length);
+        std::string errmsg = buffer;
+        delete[] buffer;
+        regfree(&compiled);
+        throw errmsg;
+      }
+      int result = regexec(&compiled, RHSs->getValue().c_str(), 0, NULL, 0);
+      if (result == REG_ESPACE) {
+        size_t length = regerror (err, &compiled, NULL, 0);
+        char *buffer = new char[length];
+        (void) regerror (err, &compiled, buffer, length);
+        std::string errmsg = buffer;
+        delete[] buffer;
+        regfree(&compiled);
+        throw errmsg;
+      }
+      regfree(&compiled);
+      return new IntInit(result == 0);
+    }    
+    break;
+  }
    case SHL:
    case SRA:
    case SRL: {
@@ -710,6 +742,7 @@ std::string BinOpInit::getAsString() const {
    case SRA: Result = "!sra"; break;
    case SRL: Result = "!srl"; break;
    case STRCONCAT: Result = "!strconcat"; break;
+  case REGMATCH: Result = "!regmatch"; break;
    case NAMECONCAT: 
      Result = "!nameconcat<" + getType()->getAsString() + ">"; break;
    }
diff --git a/utils/TableGen/Record.h b/utils/TableGen/Record.h

index 4284cabf85579b6fd753d931571e516fc209a12a..3a15ca5767fdbee5fdb973d351b6b4231cf3554f 100644 (file)
--- a/utils/TableGen/Record.h
+++ b/utils/TableGen/Record.h
@@ -802,7 +802,7 @@ public:
  ///
  class BinOpInit : public OpInit {
  public:
-  enum BinaryOp { SHL, SRA, SRL, STRCONCAT, CONCAT, NAMECONCAT };
+  enum BinaryOp { SHL, SRA, SRL, STRCONCAT, CONCAT, NAMECONCAT, REGMATCH };
  private:
    BinaryOp Opc;
    Init *LHS, *RHS;
diff --git a/utils/TableGen/TGLexer.cpp b/utils/TableGen/TGLexer.cpp

index 758d499a8b5f317a40417555a72f871f8d5bebd4..378bffb3d2eea0803a5d12d136347ca2f3cab7c9 100644 (file)
--- a/utils/TableGen/TGLexer.cpp
+++ b/utils/TableGen/TGLexer.cpp
@@ -447,6 +447,7 @@ tgtok::TokKind TGLexer::LexExclaim() {
    if (Len == 3  && !memcmp(Start, "shl", 3)) return tgtok::XSHL;
    if (Len == 9  && !memcmp(Start, "strconcat", 9))   return tgtok::XStrConcat;
    if (Len == 10 && !memcmp(Start, "nameconcat", 10)) return tgtok::XNameConcat;
+  if (Len == 8 && !memcmp(Start, "regmatch", 8)) return tgtok::XRegMatch;
    if (Len == 5 && !memcmp(Start, "subst", 5)) return tgtok::XSubst;
    if (Len == 7 && !memcmp(Start, "foreach", 7)) return tgtok::XForEach;
    if (Len == 4 && !memcmp(Start, "cast", 4)) return tgtok::XCast;
diff --git a/utils/TableGen/TGLexer.h b/utils/TableGen/TGLexer.h

index ac3b9840039b2fa2dd9738e88c40b5b84cbb713f..06f6535949ec2022841be6b65941b36b78826d95 100644 (file)
--- a/utils/TableGen/TGLexer.h
+++ b/utils/TableGen/TGLexer.h
@@ -46,7 +46,7 @@ namespace tgtok {
      
      // !keywords.
      XConcat, XSRA, XSRL, XSHL, XStrConcat, XNameConcat, XCast, XSubst,
-    XForEach, XCar, XCdr, XNull, XIf,
+    XForEach, XCar, XCdr, XNull, XIf, XRegMatch,
  
      // Integer value.
      IntVal,
diff --git a/utils/TableGen/TGParser.cpp b/utils/TableGen/TGParser.cpp

index fc6f29fd9f1b5a17fc458445119522e992391b22..b4d448b1e8c087af0a97e1eea85b6e87750e98fe 100644 (file)
--- a/utils/TableGen/TGParser.cpp
+++ b/utils/TableGen/TGParser.cpp
@@ -791,6 +791,7 @@ Init *TGParser::ParseOperation(Record *CurRec) {
    case tgtok::XSRL:
    case tgtok::XSHL:
    case tgtok::XStrConcat:
+  case tgtok::XRegMatch:
    case tgtok::XNameConcat: {  // Value ::= !binop '(' Value ',' Value ')'
      BinOpInit::BinaryOp Code;
      RecTy *Type = 0;
@@ -823,6 +824,11 @@ Init *TGParser::ParseOperation(Record *CurRec) {
        Code = BinOpInit::STRCONCAT;
        Type = new StringRecTy();
        break;
+    case tgtok::XRegMatch:  
+      Lex.Lex();  // eat the operation
+      Code = BinOpInit::REGMATCH;
+      Type = new IntRecTy();
+      break;
      case tgtok::XNameConcat: 
        Lex.Lex();  // eat the operation
        Code = BinOpInit::NAMECONCAT;
@@ -1174,6 +1180,7 @@ Init *TGParser::ParseSimpleValue(Record *CurRec) {
    case tgtok::XSRL:
    case tgtok::XSHL:
    case tgtok::XStrConcat:
+  case tgtok::XRegMatch:
    case tgtok::XNameConcat:  // Value ::= !binop '(' Value ',' Value ')'
    case tgtok::XIf:
    case tgtok::XForEach:
author	David Greene <greened@obbligato.org>
	Mon, 8 Jun 2009 17:00:34 +0000 (17:00 +0000)
committer	David Greene <greened@obbligato.org>
	Mon, 8 Jun 2009 17:00:34 +0000 (17:00 +0000)
docs/TableGenFundamentals.html		patch \| blob \| history
test/TableGen/regmatch.td	[new file with mode: 0644]	patch \| blob
utils/TableGen/Record.cpp		patch \| blob \| history
utils/TableGen/Record.h		patch \| blob \| history
utils/TableGen/TGLexer.cpp		patch \| blob \| history
utils/TableGen/TGLexer.h		patch \| blob \| history
utils/TableGen/TGParser.cpp		patch \| blob \| history