OLD | NEW |
| (Empty) |
1 // Copyright (C) 2011 Google Inc. | |
2 // | |
3 // Licensed under the Apache License, Version 2.0 (the "License"); | |
4 // you may not use this file except in compliance with the License. | |
5 // You may obtain a copy of the License at | |
6 // | |
7 // http://www.apache.org/licenses/LICENSE-2.0 | |
8 // | |
9 // Unless required by applicable law or agreed to in writing, software | |
10 // distributed under the License is distributed on an "AS IS" BASIS, | |
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
12 // See the License for the specific language governing permissions and | |
13 // limitations under the License. | |
14 | |
15 // Author: George Yakovlev | |
16 // Philippe Liard | |
17 | |
18 #include "regexp_adapter.h" | |
19 | |
20 #include <string> | |
21 | |
22 #include <gtest/gtest.h> | |
23 | |
24 #include "base/memory/scoped_ptr.h" | |
25 | |
26 namespace i18n { | |
27 namespace phonenumbers { | |
28 | |
29 using std::string; | |
30 | |
31 class RegExpAdapterTest : public testing::Test { | |
32 protected: | |
33 RegExpAdapterTest() | |
34 : digits_(RegExp::Create("\\d+")), | |
35 parentheses_digits_(RegExp::Create("\\((\\d+)\\)")), | |
36 single_digit_(RegExp::Create("\\d")), | |
37 two_digit_groups_(RegExp::Create("(\\d+)-(\\d+)")) {} | |
38 | |
39 const scoped_ptr<const RegExp> digits_; | |
40 const scoped_ptr<const RegExp> parentheses_digits_; | |
41 const scoped_ptr<const RegExp> single_digit_; | |
42 const scoped_ptr<const RegExp> two_digit_groups_; | |
43 }; | |
44 | |
45 TEST_F(RegExpAdapterTest, TestConsumeNoMatch) { | |
46 const scoped_ptr<RegExpInput> input(RegExpInput::Create("+1-123-456-789")); | |
47 | |
48 // When 'true' is passed to Consume(), the match occurs from the beginning of | |
49 // the input. | |
50 ASSERT_FALSE(digits_->Consume(input.get(), true, NULL, NULL, NULL)); | |
51 ASSERT_EQ("+1-123-456-789", input->ToString()); | |
52 | |
53 string res1; | |
54 ASSERT_FALSE(parentheses_digits_->Consume( | |
55 input.get(), true, &res1, NULL, NULL)); | |
56 ASSERT_EQ("+1-123-456-789", input->ToString()); | |
57 ASSERT_EQ("", res1); | |
58 } | |
59 | |
60 TEST_F(RegExpAdapterTest, TestConsumeWithNull) { | |
61 const scoped_ptr<RegExpInput> input(RegExpInput::Create("+123")); | |
62 const scoped_ptr<const RegExp> plus_sign(RegExp::Create("(\\+)")); | |
63 | |
64 ASSERT_TRUE(plus_sign->Consume(input.get(), true, NULL, NULL, NULL)); | |
65 ASSERT_EQ("123", input->ToString()); | |
66 } | |
67 | |
68 TEST_F(RegExpAdapterTest, TestConsumeRetainsMatches) { | |
69 const scoped_ptr<RegExpInput> input(RegExpInput::Create("1-123-456-789")); | |
70 | |
71 string res1, res2; | |
72 ASSERT_TRUE(two_digit_groups_->Consume( | |
73 input.get(), true, &res1, &res2, NULL)); | |
74 ASSERT_EQ("-456-789", input->ToString()); | |
75 ASSERT_EQ("1", res1); | |
76 ASSERT_EQ("123", res2); | |
77 } | |
78 | |
79 TEST_F(RegExpAdapterTest, TestFindAndConsume) { | |
80 const scoped_ptr<RegExpInput> input(RegExpInput::Create("+1-123-456-789")); | |
81 | |
82 // When 'false' is passed to Consume(), the match can occur from any place in | |
83 // the input. | |
84 ASSERT_TRUE(digits_->Consume(input.get(), false, NULL, NULL, NULL)); | |
85 ASSERT_EQ("-123-456-789", input->ToString()); | |
86 | |
87 ASSERT_TRUE(digits_->Consume(input.get(), false, NULL, NULL, NULL)); | |
88 ASSERT_EQ("-456-789", input->ToString()); | |
89 | |
90 ASSERT_FALSE(parentheses_digits_->Consume( | |
91 input.get(), false, NULL, NULL, NULL)); | |
92 ASSERT_EQ("-456-789", input->ToString()); | |
93 | |
94 string res1, res2; | |
95 ASSERT_TRUE(two_digit_groups_->Consume( | |
96 input.get(), false, &res1, &res2, NULL)); | |
97 ASSERT_EQ("", input->ToString()); | |
98 ASSERT_EQ("456", res1); | |
99 ASSERT_EQ("789", res2); | |
100 } | |
101 | |
102 TEST(RegExpAdapter, TestPartialMatch) { | |
103 const scoped_ptr<const RegExp> reg_exp(RegExp::Create("([\\da-z]+)")); | |
104 string matched; | |
105 | |
106 EXPECT_TRUE(reg_exp->PartialMatch("12345af", &matched)); | |
107 EXPECT_EQ("12345af", matched); | |
108 | |
109 EXPECT_TRUE(reg_exp->PartialMatch("12345af", NULL)); | |
110 | |
111 EXPECT_TRUE(reg_exp->PartialMatch("[12]", &matched)); | |
112 EXPECT_EQ("12", matched); | |
113 | |
114 matched.clear(); | |
115 EXPECT_FALSE(reg_exp->PartialMatch("[]", &matched)); | |
116 EXPECT_EQ("", matched); | |
117 } | |
118 | |
119 TEST(RegExpAdapter, TestFullMatch) { | |
120 const scoped_ptr<const RegExp> reg_exp(RegExp::Create("([\\da-z]+)")); | |
121 string matched; | |
122 | |
123 EXPECT_TRUE(reg_exp->FullMatch("12345af", &matched)); | |
124 EXPECT_EQ("12345af", matched); | |
125 | |
126 EXPECT_TRUE(reg_exp->FullMatch("12345af", NULL)); | |
127 | |
128 matched.clear(); | |
129 EXPECT_FALSE(reg_exp->FullMatch("[12]", &matched)); | |
130 EXPECT_EQ("", matched); | |
131 | |
132 matched.clear(); | |
133 EXPECT_FALSE(reg_exp->FullMatch("[]", &matched)); | |
134 EXPECT_EQ("", matched); | |
135 } | |
136 | |
137 TEST_F(RegExpAdapterTest, TestReplace) { | |
138 string input("123-4567 "); | |
139 | |
140 ASSERT_TRUE(single_digit_->Replace(&input, "+")); | |
141 ASSERT_EQ("+23-4567 ", input); | |
142 | |
143 ASSERT_TRUE(single_digit_->Replace(&input, "+")); | |
144 ASSERT_EQ("++3-4567 ", input); | |
145 | |
146 const scoped_ptr<const RegExp> single_letter(RegExp::Create("[a-z]")); | |
147 ASSERT_FALSE(single_letter->Replace(&input, "+")); | |
148 ASSERT_EQ("++3-4567 ", input); | |
149 } | |
150 | |
151 TEST_F(RegExpAdapterTest, TestReplaceWithGroup) { | |
152 // Make sure referencing groups in the regexp in the replacement string works. | |
153 // $[0-9] notation is used. | |
154 string input = "123-4567 abc"; | |
155 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$2")); | |
156 ASSERT_EQ("4567 abc", input); | |
157 | |
158 input = "123-4567"; | |
159 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$1")); | |
160 ASSERT_EQ("123", input); | |
161 | |
162 input = "123-4567"; | |
163 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$2")); | |
164 ASSERT_EQ("4567", input); | |
165 | |
166 input = "123-4567"; | |
167 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$1 $2")); | |
168 ASSERT_EQ("123 4567", input); | |
169 } | |
170 | |
171 TEST_F(RegExpAdapterTest, TestReplaceWithDollarSign) { | |
172 // Make sure '$' can be used in the replacement string when escaped. | |
173 string input = "123-4567"; | |
174 ASSERT_TRUE(two_digit_groups_->Replace(&input, "\\$1 \\$2")); | |
175 ASSERT_EQ("$1 $2", input); | |
176 } | |
177 | |
178 TEST_F(RegExpAdapterTest, TestGlobalReplace) { | |
179 string input("123-4567 "); | |
180 | |
181 ASSERT_TRUE(single_digit_->GlobalReplace(&input, "*")); | |
182 ASSERT_EQ("***-**** ", input); | |
183 | |
184 ASSERT_FALSE(single_digit_->GlobalReplace(&input, "*")); | |
185 ASSERT_EQ("***-**** ", input); | |
186 } | |
187 | |
188 TEST(RegExpAdapter, TestUtf8) { | |
189 const scoped_ptr<const RegExp> reg_exp(RegExp::Create("\xE2\x84\xA1\xE2\x8A\x8
F([\xCE\xB1-\xCF\x89]*)\xE2\x8A\x90")); | |
190 string matched; | |
191 | |
192 EXPECT_FALSE(reg_exp->Match("\xE2\x84\xA1\xE2\x8A\x8F" "123\xE2\x8A\x90", true
, &matched)); | |
193 EXPECT_TRUE(reg_exp->Match("\xE2\x84\xA1\xE2\x8A\x8F\xCE\xB1\xCE\xB2\xE2\x8A\x
90", true, &matched)); | |
194 EXPECT_EQ("\xCE\xB1\xCE\xB2", matched); | |
195 } | |
196 | |
197 } // namespace phonenumbers | |
198 } // namespace i18n | |
OLD | NEW |