RegexTest.cpp 5.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181
  1. //===- llvm/unittest/Support/RegexTest.cpp - Regex tests --===//
  2. //
  3. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
  4. // See https://llvm.org/LICENSE.txt for license information.
  5. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  6. //
  7. //===----------------------------------------------------------------------===//
  8. #include "llvm/Support/Regex.h"
  9. #include "llvm/ADT/SmallVector.h"
  10. #include "gtest/gtest.h"
  11. #include <cstring>
  12. using namespace llvm;
  13. namespace {
  14. class RegexTest : public ::testing::Test {
  15. };
  16. TEST_F(RegexTest, Basics) {
  17. Regex r1("^[0-9]+$");
  18. EXPECT_TRUE(r1.match("916"));
  19. EXPECT_TRUE(r1.match("9"));
  20. EXPECT_FALSE(r1.match("9a"));
  21. SmallVector<StringRef, 1> Matches;
  22. Regex r2("[0-9]+");
  23. EXPECT_TRUE(r2.match("aa216b", &Matches));
  24. EXPECT_EQ(1u, Matches.size());
  25. EXPECT_EQ("216", Matches[0].str());
  26. Regex r3("[0-9]+([a-f])?:([0-9]+)");
  27. EXPECT_TRUE(r3.match("9a:513b", &Matches));
  28. EXPECT_EQ(3u, Matches.size());
  29. EXPECT_EQ("9a:513", Matches[0].str());
  30. EXPECT_EQ("a", Matches[1].str());
  31. EXPECT_EQ("513", Matches[2].str());
  32. EXPECT_TRUE(r3.match("9:513b", &Matches));
  33. EXPECT_EQ(3u, Matches.size());
  34. EXPECT_EQ("9:513", Matches[0].str());
  35. EXPECT_EQ("", Matches[1].str());
  36. EXPECT_EQ("513", Matches[2].str());
  37. Regex r4("a[^b]+b");
  38. std::string String="axxb";
  39. String[2] = '\0';
  40. EXPECT_FALSE(r4.match("abb"));
  41. EXPECT_TRUE(r4.match(String, &Matches));
  42. EXPECT_EQ(1u, Matches.size());
  43. EXPECT_EQ(String, Matches[0].str());
  44. std::string NulPattern="X[0-9]+X([a-f])?:([0-9]+)";
  45. String="YX99a:513b";
  46. NulPattern[7] = '\0';
  47. Regex r5(NulPattern);
  48. EXPECT_FALSE(r5.match(String));
  49. EXPECT_FALSE(r5.match("X9"));
  50. String[3]='\0';
  51. EXPECT_TRUE(r5.match(String));
  52. }
  53. TEST_F(RegexTest, Backreferences) {
  54. Regex r1("([a-z]+)_\\1");
  55. SmallVector<StringRef, 4> Matches;
  56. EXPECT_TRUE(r1.match("abc_abc", &Matches));
  57. EXPECT_EQ(2u, Matches.size());
  58. EXPECT_FALSE(r1.match("abc_ab", &Matches));
  59. Regex r2("a([0-9])b\\1c\\1");
  60. EXPECT_TRUE(r2.match("a4b4c4", &Matches));
  61. EXPECT_EQ(2u, Matches.size());
  62. EXPECT_EQ("4", Matches[1].str());
  63. EXPECT_FALSE(r2.match("a2b2c3"));
  64. Regex r3("a([0-9])([a-z])b\\1\\2");
  65. EXPECT_TRUE(r3.match("a6zb6z", &Matches));
  66. EXPECT_EQ(3u, Matches.size());
  67. EXPECT_EQ("6", Matches[1].str());
  68. EXPECT_EQ("z", Matches[2].str());
  69. EXPECT_FALSE(r3.match("a6zb6y"));
  70. EXPECT_FALSE(r3.match("a6zb7z"));
  71. }
  72. TEST_F(RegexTest, Substitution) {
  73. std::string Error;
  74. EXPECT_EQ("aNUMber", Regex("[0-9]+").sub("NUM", "a1234ber"));
  75. // Standard Escapes
  76. EXPECT_EQ("a\\ber", Regex("[0-9]+").sub("\\\\", "a1234ber", &Error));
  77. EXPECT_EQ("", Error);
  78. EXPECT_EQ("a\nber", Regex("[0-9]+").sub("\\n", "a1234ber", &Error));
  79. EXPECT_EQ("", Error);
  80. EXPECT_EQ("a\tber", Regex("[0-9]+").sub("\\t", "a1234ber", &Error));
  81. EXPECT_EQ("", Error);
  82. EXPECT_EQ("ajber", Regex("[0-9]+").sub("\\j", "a1234ber", &Error));
  83. EXPECT_EQ("", Error);
  84. EXPECT_EQ("aber", Regex("[0-9]+").sub("\\", "a1234ber", &Error));
  85. EXPECT_EQ(Error, "replacement string contained trailing backslash");
  86. // Backreferences
  87. EXPECT_EQ("aa1234bber", Regex("a[0-9]+b").sub("a\\0b", "a1234ber", &Error));
  88. EXPECT_EQ("", Error);
  89. EXPECT_EQ("a1234ber", Regex("a([0-9]+)b").sub("a\\1b", "a1234ber", &Error));
  90. EXPECT_EQ("", Error);
  91. EXPECT_EQ("aber", Regex("a[0-9]+b").sub("a\\100b", "a1234ber", &Error));
  92. EXPECT_EQ(Error, "invalid backreference string '100'");
  93. }
  94. TEST_F(RegexTest, IsLiteralERE) {
  95. EXPECT_TRUE(Regex::isLiteralERE("abc"));
  96. EXPECT_FALSE(Regex::isLiteralERE("a(bc)"));
  97. EXPECT_FALSE(Regex::isLiteralERE("^abc"));
  98. EXPECT_FALSE(Regex::isLiteralERE("abc$"));
  99. EXPECT_FALSE(Regex::isLiteralERE("a|bc"));
  100. EXPECT_FALSE(Regex::isLiteralERE("abc*"));
  101. EXPECT_FALSE(Regex::isLiteralERE("abc+"));
  102. EXPECT_FALSE(Regex::isLiteralERE("abc?"));
  103. EXPECT_FALSE(Regex::isLiteralERE("abc."));
  104. EXPECT_FALSE(Regex::isLiteralERE("a[bc]"));
  105. EXPECT_FALSE(Regex::isLiteralERE("abc\\1"));
  106. EXPECT_FALSE(Regex::isLiteralERE("abc{1,2}"));
  107. }
  108. TEST_F(RegexTest, Escape) {
  109. EXPECT_EQ("a\\[bc\\]", Regex::escape("a[bc]"));
  110. EXPECT_EQ("abc\\{1\\\\,2\\}", Regex::escape("abc{1\\,2}"));
  111. }
  112. TEST_F(RegexTest, IsValid) {
  113. std::string Error;
  114. EXPECT_FALSE(Regex("(foo").isValid(Error));
  115. EXPECT_EQ("parentheses not balanced", Error);
  116. EXPECT_FALSE(Regex("a[b-").isValid(Error));
  117. EXPECT_EQ("invalid character range", Error);
  118. }
  119. TEST_F(RegexTest, MoveConstruct) {
  120. Regex r1("^[0-9]+$");
  121. Regex r2(std::move(r1));
  122. EXPECT_TRUE(r2.match("916"));
  123. }
  124. TEST_F(RegexTest, MoveAssign) {
  125. Regex r1("^[0-9]+$");
  126. Regex r2("abc");
  127. r2 = std::move(r1);
  128. EXPECT_TRUE(r2.match("916"));
  129. std::string Error;
  130. EXPECT_FALSE(r1.isValid(Error));
  131. }
  132. TEST_F(RegexTest, NoArgConstructor) {
  133. std::string Error;
  134. Regex r1;
  135. EXPECT_FALSE(r1.isValid(Error));
  136. EXPECT_EQ("invalid regular expression", Error);
  137. r1 = Regex("abc");
  138. EXPECT_TRUE(r1.isValid(Error));
  139. }
  140. TEST_F(RegexTest, MatchInvalid) {
  141. Regex r1;
  142. std::string Error;
  143. EXPECT_FALSE(r1.isValid(Error));
  144. EXPECT_FALSE(r1.match("X"));
  145. }
  146. // https://bugs.chromium.org/p/oss-fuzz/issues/detail?id=3727
  147. TEST_F(RegexTest, OssFuzz3727Regression) {
  148. // Wrap in a StringRef so the NUL byte doesn't terminate the string
  149. Regex r(StringRef("[[[=GS\x00[=][", 10));
  150. std::string Error;
  151. EXPECT_FALSE(r.isValid(Error));
  152. }
  153. }