1f4a2713aSLionel Sambuc //===- llvm/unittest/Support/RegexTest.cpp - Regex tests --===//
2f4a2713aSLionel Sambuc //
3f4a2713aSLionel Sambuc // The LLVM Compiler Infrastructure
4f4a2713aSLionel Sambuc //
5f4a2713aSLionel Sambuc // This file is distributed under the University of Illinois Open Source
6f4a2713aSLionel Sambuc // License. See LICENSE.TXT for details.
7f4a2713aSLionel Sambuc //
8f4a2713aSLionel Sambuc //===----------------------------------------------------------------------===//
9f4a2713aSLionel Sambuc
10f4a2713aSLionel Sambuc #include "llvm/Support/Regex.h"
11f4a2713aSLionel Sambuc #include "llvm/ADT/SmallVector.h"
12f4a2713aSLionel Sambuc #include "gtest/gtest.h"
13f4a2713aSLionel Sambuc #include <cstring>
14f4a2713aSLionel Sambuc
15f4a2713aSLionel Sambuc using namespace llvm;
16f4a2713aSLionel Sambuc namespace {
17f4a2713aSLionel Sambuc
18f4a2713aSLionel Sambuc class RegexTest : public ::testing::Test {
19f4a2713aSLionel Sambuc };
20f4a2713aSLionel Sambuc
TEST_F(RegexTest,Basics)21f4a2713aSLionel Sambuc TEST_F(RegexTest, Basics) {
22f4a2713aSLionel Sambuc Regex r1("^[0-9]+$");
23f4a2713aSLionel Sambuc EXPECT_TRUE(r1.match("916"));
24f4a2713aSLionel Sambuc EXPECT_TRUE(r1.match("9"));
25f4a2713aSLionel Sambuc EXPECT_FALSE(r1.match("9a"));
26f4a2713aSLionel Sambuc
27f4a2713aSLionel Sambuc SmallVector<StringRef, 1> Matches;
28f4a2713aSLionel Sambuc Regex r2("[0-9]+");
29f4a2713aSLionel Sambuc EXPECT_TRUE(r2.match("aa216b", &Matches));
30f4a2713aSLionel Sambuc EXPECT_EQ(1u, Matches.size());
31f4a2713aSLionel Sambuc EXPECT_EQ("216", Matches[0].str());
32f4a2713aSLionel Sambuc
33f4a2713aSLionel Sambuc Regex r3("[0-9]+([a-f])?:([0-9]+)");
34f4a2713aSLionel Sambuc EXPECT_TRUE(r3.match("9a:513b", &Matches));
35f4a2713aSLionel Sambuc EXPECT_EQ(3u, Matches.size());
36f4a2713aSLionel Sambuc EXPECT_EQ("9a:513", Matches[0].str());
37f4a2713aSLionel Sambuc EXPECT_EQ("a", Matches[1].str());
38f4a2713aSLionel Sambuc EXPECT_EQ("513", Matches[2].str());
39f4a2713aSLionel Sambuc
40f4a2713aSLionel Sambuc EXPECT_TRUE(r3.match("9:513b", &Matches));
41f4a2713aSLionel Sambuc EXPECT_EQ(3u, Matches.size());
42f4a2713aSLionel Sambuc EXPECT_EQ("9:513", Matches[0].str());
43f4a2713aSLionel Sambuc EXPECT_EQ("", Matches[1].str());
44f4a2713aSLionel Sambuc EXPECT_EQ("513", Matches[2].str());
45f4a2713aSLionel Sambuc
46f4a2713aSLionel Sambuc Regex r4("a[^b]+b");
47f4a2713aSLionel Sambuc std::string String="axxb";
48f4a2713aSLionel Sambuc String[2] = '\0';
49f4a2713aSLionel Sambuc EXPECT_FALSE(r4.match("abb"));
50f4a2713aSLionel Sambuc EXPECT_TRUE(r4.match(String, &Matches));
51f4a2713aSLionel Sambuc EXPECT_EQ(1u, Matches.size());
52f4a2713aSLionel Sambuc EXPECT_EQ(String, Matches[0].str());
53f4a2713aSLionel Sambuc
54f4a2713aSLionel Sambuc std::string NulPattern="X[0-9]+X([a-f])?:([0-9]+)";
55f4a2713aSLionel Sambuc String="YX99a:513b";
56f4a2713aSLionel Sambuc NulPattern[7] = '\0';
57f4a2713aSLionel Sambuc Regex r5(NulPattern);
58f4a2713aSLionel Sambuc EXPECT_FALSE(r5.match(String));
59f4a2713aSLionel Sambuc EXPECT_FALSE(r5.match("X9"));
60f4a2713aSLionel Sambuc String[3]='\0';
61f4a2713aSLionel Sambuc EXPECT_TRUE(r5.match(String));
62f4a2713aSLionel Sambuc }
63f4a2713aSLionel Sambuc
TEST_F(RegexTest,Backreferences)64f4a2713aSLionel Sambuc TEST_F(RegexTest, Backreferences) {
65f4a2713aSLionel Sambuc Regex r1("([a-z]+)_\\1");
66f4a2713aSLionel Sambuc SmallVector<StringRef, 4> Matches;
67f4a2713aSLionel Sambuc EXPECT_TRUE(r1.match("abc_abc", &Matches));
68f4a2713aSLionel Sambuc EXPECT_EQ(2u, Matches.size());
69f4a2713aSLionel Sambuc EXPECT_FALSE(r1.match("abc_ab", &Matches));
70f4a2713aSLionel Sambuc
71f4a2713aSLionel Sambuc Regex r2("a([0-9])b\\1c\\1");
72f4a2713aSLionel Sambuc EXPECT_TRUE(r2.match("a4b4c4", &Matches));
73f4a2713aSLionel Sambuc EXPECT_EQ(2u, Matches.size());
74f4a2713aSLionel Sambuc EXPECT_EQ("4", Matches[1].str());
75f4a2713aSLionel Sambuc EXPECT_FALSE(r2.match("a2b2c3"));
76f4a2713aSLionel Sambuc
77f4a2713aSLionel Sambuc Regex r3("a([0-9])([a-z])b\\1\\2");
78f4a2713aSLionel Sambuc EXPECT_TRUE(r3.match("a6zb6z", &Matches));
79f4a2713aSLionel Sambuc EXPECT_EQ(3u, Matches.size());
80f4a2713aSLionel Sambuc EXPECT_EQ("6", Matches[1].str());
81f4a2713aSLionel Sambuc EXPECT_EQ("z", Matches[2].str());
82f4a2713aSLionel Sambuc EXPECT_FALSE(r3.match("a6zb6y"));
83f4a2713aSLionel Sambuc EXPECT_FALSE(r3.match("a6zb7z"));
84f4a2713aSLionel Sambuc }
85f4a2713aSLionel Sambuc
TEST_F(RegexTest,Substitution)86f4a2713aSLionel Sambuc TEST_F(RegexTest, Substitution) {
87f4a2713aSLionel Sambuc std::string Error;
88f4a2713aSLionel Sambuc
89f4a2713aSLionel Sambuc EXPECT_EQ("aNUMber", Regex("[0-9]+").sub("NUM", "a1234ber"));
90f4a2713aSLionel Sambuc
91f4a2713aSLionel Sambuc // Standard Escapes
92f4a2713aSLionel Sambuc EXPECT_EQ("a\\ber", Regex("[0-9]+").sub("\\\\", "a1234ber", &Error));
93*0a6a1f1dSLionel Sambuc EXPECT_EQ("", Error);
94f4a2713aSLionel Sambuc EXPECT_EQ("a\nber", Regex("[0-9]+").sub("\\n", "a1234ber", &Error));
95*0a6a1f1dSLionel Sambuc EXPECT_EQ("", Error);
96f4a2713aSLionel Sambuc EXPECT_EQ("a\tber", Regex("[0-9]+").sub("\\t", "a1234ber", &Error));
97*0a6a1f1dSLionel Sambuc EXPECT_EQ("", Error);
98f4a2713aSLionel Sambuc EXPECT_EQ("ajber", Regex("[0-9]+").sub("\\j", "a1234ber", &Error));
99*0a6a1f1dSLionel Sambuc EXPECT_EQ("", Error);
100f4a2713aSLionel Sambuc
101f4a2713aSLionel Sambuc EXPECT_EQ("aber", Regex("[0-9]+").sub("\\", "a1234ber", &Error));
102f4a2713aSLionel Sambuc EXPECT_EQ(Error, "replacement string contained trailing backslash");
103f4a2713aSLionel Sambuc
104f4a2713aSLionel Sambuc // Backreferences
105f4a2713aSLionel Sambuc EXPECT_EQ("aa1234bber", Regex("a[0-9]+b").sub("a\\0b", "a1234ber", &Error));
106*0a6a1f1dSLionel Sambuc EXPECT_EQ("", Error);
107f4a2713aSLionel Sambuc
108f4a2713aSLionel Sambuc EXPECT_EQ("a1234ber", Regex("a([0-9]+)b").sub("a\\1b", "a1234ber", &Error));
109*0a6a1f1dSLionel Sambuc EXPECT_EQ("", Error);
110f4a2713aSLionel Sambuc
111f4a2713aSLionel Sambuc EXPECT_EQ("aber", Regex("a[0-9]+b").sub("a\\100b", "a1234ber", &Error));
112f4a2713aSLionel Sambuc EXPECT_EQ(Error, "invalid backreference string '100'");
113f4a2713aSLionel Sambuc }
114f4a2713aSLionel Sambuc
TEST_F(RegexTest,IsLiteralERE)115f4a2713aSLionel Sambuc TEST_F(RegexTest, IsLiteralERE) {
116f4a2713aSLionel Sambuc EXPECT_TRUE(Regex::isLiteralERE("abc"));
117f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("a(bc)"));
118f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("^abc"));
119f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("abc$"));
120f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("a|bc"));
121f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("abc*"));
122f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("abc+"));
123f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("abc?"));
124f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("abc."));
125f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("a[bc]"));
126f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("abc\\1"));
127f4a2713aSLionel Sambuc EXPECT_FALSE(Regex::isLiteralERE("abc{1,2}"));
128f4a2713aSLionel Sambuc }
129f4a2713aSLionel Sambuc
TEST_F(RegexTest,Escape)130*0a6a1f1dSLionel Sambuc TEST_F(RegexTest, Escape) {
131*0a6a1f1dSLionel Sambuc EXPECT_EQ("a\\[bc\\]", Regex::escape("a[bc]"));
132*0a6a1f1dSLionel Sambuc EXPECT_EQ("abc\\{1\\\\,2\\}", Regex::escape("abc{1\\,2}"));
133*0a6a1f1dSLionel Sambuc }
134*0a6a1f1dSLionel Sambuc
TEST_F(RegexTest,IsValid)135f4a2713aSLionel Sambuc TEST_F(RegexTest, IsValid) {
136f4a2713aSLionel Sambuc std::string Error;
137f4a2713aSLionel Sambuc EXPECT_FALSE(Regex("(foo").isValid(Error));
138f4a2713aSLionel Sambuc EXPECT_EQ("parentheses not balanced", Error);
139f4a2713aSLionel Sambuc EXPECT_FALSE(Regex("a[b-").isValid(Error));
140f4a2713aSLionel Sambuc EXPECT_EQ("invalid character range", Error);
141f4a2713aSLionel Sambuc }
142f4a2713aSLionel Sambuc
TEST_F(RegexTest,MoveConstruct)143*0a6a1f1dSLionel Sambuc TEST_F(RegexTest, MoveConstruct) {
144*0a6a1f1dSLionel Sambuc Regex r1("^[0-9]+$");
145*0a6a1f1dSLionel Sambuc Regex r2(std::move(r1));
146*0a6a1f1dSLionel Sambuc EXPECT_TRUE(r2.match("916"));
147*0a6a1f1dSLionel Sambuc }
148*0a6a1f1dSLionel Sambuc
TEST_F(RegexTest,MoveAssign)149*0a6a1f1dSLionel Sambuc TEST_F(RegexTest, MoveAssign) {
150*0a6a1f1dSLionel Sambuc Regex r1("^[0-9]+$");
151*0a6a1f1dSLionel Sambuc Regex r2("abc");
152*0a6a1f1dSLionel Sambuc r2 = std::move(r1);
153*0a6a1f1dSLionel Sambuc EXPECT_TRUE(r2.match("916"));
154*0a6a1f1dSLionel Sambuc }
155*0a6a1f1dSLionel Sambuc
156f4a2713aSLionel Sambuc }
157