OLD | NEW |
(Empty) | |
| 1 // Copyright (C) 2011 Google Inc. |
| 2 // |
| 3 // Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 // you may not use this file except in compliance with the License. |
| 5 // You may obtain a copy of the License at |
| 6 // |
| 7 // http://www.apache.org/licenses/LICENSE-2.0 |
| 8 // |
| 9 // Unless required by applicable law or agreed to in writing, software |
| 10 // distributed under the License is distributed on an "AS IS" BASIS, |
| 11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 12 // See the License for the specific language governing permissions and |
| 13 // limitations under the License. |
| 14 |
| 15 // Author: George Yakovlev |
| 16 // Philippe Liard |
| 17 |
| 18 #include "regexp_adapter.h" |
| 19 |
| 20 #include <string> |
| 21 |
| 22 #include <gtest/gtest.h> |
| 23 |
| 24 #include "base/memory/scoped_ptr.h" |
| 25 |
| 26 namespace i18n { |
| 27 namespace phonenumbers { |
| 28 |
| 29 using std::string; |
| 30 |
| 31 class RegExpAdapterTest : public testing::Test { |
| 32 protected: |
| 33 RegExpAdapterTest() |
| 34 : digits_(RegExp::Create("\\d+")), |
| 35 parentheses_digits_(RegExp::Create("\\((\\d+)\\)")), |
| 36 single_digit_(RegExp::Create("\\d")), |
| 37 two_digit_groups_(RegExp::Create("(\\d+)-(\\d+)")) {} |
| 38 |
| 39 const scoped_ptr<const RegExp> digits_; |
| 40 const scoped_ptr<const RegExp> parentheses_digits_; |
| 41 const scoped_ptr<const RegExp> single_digit_; |
| 42 const scoped_ptr<const RegExp> two_digit_groups_; |
| 43 }; |
| 44 |
| 45 TEST_F(RegExpAdapterTest, TestConsumeNoMatch) { |
| 46 const scoped_ptr<RegExpInput> input(RegExpInput::Create("+1-123-456-789")); |
| 47 |
| 48 // When 'true' is passed to Consume(), the match occurs from the beginning of |
| 49 // the input. |
| 50 ASSERT_FALSE(digits_->Consume(input.get(), true, NULL, NULL, NULL)); |
| 51 ASSERT_EQ("+1-123-456-789", input->ToString()); |
| 52 |
| 53 string res1; |
| 54 ASSERT_FALSE(parentheses_digits_->Consume( |
| 55 input.get(), true, &res1, NULL, NULL)); |
| 56 ASSERT_EQ("+1-123-456-789", input->ToString()); |
| 57 ASSERT_EQ("", res1); |
| 58 } |
| 59 |
| 60 TEST_F(RegExpAdapterTest, TestConsumeWithNull) { |
| 61 const scoped_ptr<RegExpInput> input(RegExpInput::Create("+123")); |
| 62 const scoped_ptr<const RegExp> plus_sign(RegExp::Create("(\\+)")); |
| 63 |
| 64 ASSERT_TRUE(plus_sign->Consume(input.get(), true, NULL, NULL, NULL)); |
| 65 ASSERT_EQ("123", input->ToString()); |
| 66 } |
| 67 |
| 68 TEST_F(RegExpAdapterTest, TestConsumeRetainsMatches) { |
| 69 const scoped_ptr<RegExpInput> input(RegExpInput::Create("1-123-456-789")); |
| 70 |
| 71 string res1, res2; |
| 72 ASSERT_TRUE(two_digit_groups_->Consume( |
| 73 input.get(), true, &res1, &res2, NULL)); |
| 74 ASSERT_EQ("-456-789", input->ToString()); |
| 75 ASSERT_EQ("1", res1); |
| 76 ASSERT_EQ("123", res2); |
| 77 } |
| 78 |
| 79 TEST_F(RegExpAdapterTest, TestFindAndConsume) { |
| 80 const scoped_ptr<RegExpInput> input(RegExpInput::Create("+1-123-456-789")); |
| 81 |
| 82 // When 'false' is passed to Consume(), the match can occur from any place in |
| 83 // the input. |
| 84 ASSERT_TRUE(digits_->Consume(input.get(), false, NULL, NULL, NULL)); |
| 85 ASSERT_EQ("-123-456-789", input->ToString()); |
| 86 |
| 87 ASSERT_TRUE(digits_->Consume(input.get(), false, NULL, NULL, NULL)); |
| 88 ASSERT_EQ("-456-789", input->ToString()); |
| 89 |
| 90 ASSERT_FALSE(parentheses_digits_->Consume( |
| 91 input.get(), false, NULL, NULL, NULL)); |
| 92 ASSERT_EQ("-456-789", input->ToString()); |
| 93 |
| 94 string res1, res2; |
| 95 ASSERT_TRUE(two_digit_groups_->Consume( |
| 96 input.get(), false, &res1, &res2, NULL)); |
| 97 ASSERT_EQ("", input->ToString()); |
| 98 ASSERT_EQ("456", res1); |
| 99 ASSERT_EQ("789", res2); |
| 100 } |
| 101 |
| 102 TEST(RegExpAdapter, TestPartialMatch) { |
| 103 const scoped_ptr<const RegExp> reg_exp(RegExp::Create("([\\da-z]+)")); |
| 104 string matched; |
| 105 |
| 106 EXPECT_TRUE(reg_exp->PartialMatch("12345af", &matched)); |
| 107 EXPECT_EQ("12345af", matched); |
| 108 |
| 109 EXPECT_TRUE(reg_exp->PartialMatch("12345af", NULL)); |
| 110 |
| 111 EXPECT_TRUE(reg_exp->PartialMatch("[12]", &matched)); |
| 112 EXPECT_EQ("12", matched); |
| 113 |
| 114 matched.clear(); |
| 115 EXPECT_FALSE(reg_exp->PartialMatch("[]", &matched)); |
| 116 EXPECT_EQ("", matched); |
| 117 } |
| 118 |
| 119 TEST(RegExpAdapter, TestFullMatch) { |
| 120 const scoped_ptr<const RegExp> reg_exp(RegExp::Create("([\\da-z]+)")); |
| 121 string matched; |
| 122 |
| 123 EXPECT_TRUE(reg_exp->FullMatch("12345af", &matched)); |
| 124 EXPECT_EQ("12345af", matched); |
| 125 |
| 126 EXPECT_TRUE(reg_exp->FullMatch("12345af", NULL)); |
| 127 |
| 128 matched.clear(); |
| 129 EXPECT_FALSE(reg_exp->FullMatch("[12]", &matched)); |
| 130 EXPECT_EQ("", matched); |
| 131 |
| 132 matched.clear(); |
| 133 EXPECT_FALSE(reg_exp->FullMatch("[]", &matched)); |
| 134 EXPECT_EQ("", matched); |
| 135 } |
| 136 |
| 137 TEST_F(RegExpAdapterTest, TestReplace) { |
| 138 string input("123-4567 "); |
| 139 |
| 140 ASSERT_TRUE(single_digit_->Replace(&input, "+")); |
| 141 ASSERT_EQ("+23-4567 ", input); |
| 142 |
| 143 ASSERT_TRUE(single_digit_->Replace(&input, "+")); |
| 144 ASSERT_EQ("++3-4567 ", input); |
| 145 |
| 146 const scoped_ptr<const RegExp> single_letter(RegExp::Create("[a-z]")); |
| 147 ASSERT_FALSE(single_letter->Replace(&input, "+")); |
| 148 ASSERT_EQ("++3-4567 ", input); |
| 149 } |
| 150 |
| 151 TEST_F(RegExpAdapterTest, TestReplaceWithGroup) { |
| 152 // Make sure referencing groups in the regexp in the replacement string works. |
| 153 // $[0-9] notation is used. |
| 154 string input = "123-4567 abc"; |
| 155 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$2")); |
| 156 ASSERT_EQ("4567 abc", input); |
| 157 |
| 158 input = "123-4567"; |
| 159 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$1")); |
| 160 ASSERT_EQ("123", input); |
| 161 |
| 162 input = "123-4567"; |
| 163 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$2")); |
| 164 ASSERT_EQ("4567", input); |
| 165 |
| 166 input = "123-4567"; |
| 167 ASSERT_TRUE(two_digit_groups_->Replace(&input, "$1 $2")); |
| 168 ASSERT_EQ("123 4567", input); |
| 169 } |
| 170 |
| 171 TEST_F(RegExpAdapterTest, TestReplaceWithDollarSign) { |
| 172 // Make sure '$' can be used in the replacement string when escaped. |
| 173 string input = "123-4567"; |
| 174 ASSERT_TRUE(two_digit_groups_->Replace(&input, "\\$1 \\$2")); |
| 175 ASSERT_EQ("$1 $2", input); |
| 176 } |
| 177 |
| 178 TEST_F(RegExpAdapterTest, TestGlobalReplace) { |
| 179 string input("123-4567 "); |
| 180 |
| 181 ASSERT_TRUE(single_digit_->GlobalReplace(&input, "*")); |
| 182 ASSERT_EQ("***-**** ", input); |
| 183 |
| 184 ASSERT_FALSE(single_digit_->GlobalReplace(&input, "*")); |
| 185 ASSERT_EQ("***-**** ", input); |
| 186 } |
| 187 |
| 188 TEST(RegExpAdapter, TestUtf8) { |
| 189 const scoped_ptr<const RegExp> reg_exp(RegExp::Create("\xE2\x84\xA1\xE2\x8A\x8
F([\xCE\xB1-\xCF\x89]*)\xE2\x8A\x90")); |
| 190 string matched; |
| 191 |
| 192 EXPECT_FALSE(reg_exp->Match("\xE2\x84\xA1\xE2\x8A\x8F" "123\xE2\x8A\x90", true
, &matched)); |
| 193 EXPECT_TRUE(reg_exp->Match("\xE2\x84\xA1\xE2\x8A\x8F\xCE\xB1\xCE\xB2\xE2\x8A\x
90", true, &matched)); |
| 194 EXPECT_EQ("\xCE\xB1\xCE\xB2", matched); |
| 195 } |
| 196 |
| 197 } // namespace phonenumbers |
| 198 } // namespace i18n |
OLD | NEW |