From aa80e61b0d79ddf9593f6217063574d0c66c3099 Mon Sep 17 00:00:00 2001 From: Peter Collingbourne Date: Mon, 5 Aug 2013 17:47:59 +0000 Subject: [PATCH] Introduce Regex::isLiteralERE function. This will be used to implement an optimisation for literal entries in special case lists. Differential Revision: http://llvm-reviews.chandlerc.com/D1278 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@187731 91177308-0d34-0410-b5e6-96231b3b80d8 --- include/llvm/Support/Regex.h | 4 ++++ lib/Support/Regex.cpp | 7 +++++++ unittests/Support/RegexTest.cpp | 15 +++++++++++++++ 3 files changed, 26 insertions(+) diff --git a/include/llvm/Support/Regex.h b/include/llvm/Support/Regex.h index 82df2c67bd0..3d071bedbd8 100644 --- a/include/llvm/Support/Regex.h +++ b/include/llvm/Support/Regex.h @@ -77,6 +77,10 @@ namespace llvm { /// string. std::string sub(StringRef Repl, StringRef String, std::string *Error = 0); + /// \brief If this function returns true, ^Str$ is an extended regular + /// expression that matches Str and only Str. + static bool isLiteralERE(StringRef Str); + private: struct llvm_regex *preg; int error; diff --git a/lib/Support/Regex.cpp b/lib/Support/Regex.cpp index efc8b90a009..dec967e33f5 100644 --- a/lib/Support/Regex.cpp +++ b/lib/Support/Regex.cpp @@ -168,3 +168,10 @@ std::string Regex::sub(StringRef Repl, StringRef String, return Res; } + +bool Regex::isLiteralERE(StringRef Str) { + // Check for regex metacharacters. This list was derived from our regex + // implementation in regcomp.c and double checked against the POSIX extended + // regular expression specification. + return Str.find_first_of("()^$|*+?.[]\\{}") == StringRef::npos; +} diff --git a/unittests/Support/RegexTest.cpp b/unittests/Support/RegexTest.cpp index 3577d1015e9..02869b3ed46 100644 --- a/unittests/Support/RegexTest.cpp +++ b/unittests/Support/RegexTest.cpp @@ -112,4 +112,19 @@ TEST_F(RegexTest, Substitution) { EXPECT_EQ(Error, "invalid backreference string '100'"); } +TEST_F(RegexTest, IsLiteralERE) { + EXPECT_TRUE(Regex::isLiteralERE("abc")); + EXPECT_FALSE(Regex::isLiteralERE("a(bc)")); + EXPECT_FALSE(Regex::isLiteralERE("^abc")); + EXPECT_FALSE(Regex::isLiteralERE("abc$")); + EXPECT_FALSE(Regex::isLiteralERE("a|bc")); + EXPECT_FALSE(Regex::isLiteralERE("abc*")); + EXPECT_FALSE(Regex::isLiteralERE("abc+")); + EXPECT_FALSE(Regex::isLiteralERE("abc?")); + EXPECT_FALSE(Regex::isLiteralERE("abc.")); + EXPECT_FALSE(Regex::isLiteralERE("a[bc]")); + EXPECT_FALSE(Regex::isLiteralERE("abc\\1")); + EXPECT_FALSE(Regex::isLiteralERE("abc{1,2}")); +} + } -- 2.34.1