Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(3165)

Unified Diff: chrome/renderer/spellchecker/spellcheck_worditerator.cc

Issue 270203003: Refactor code to avoid direct dependency upon ICU: spellcheck_worditerator (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@refactoring_icu_usage
Patch Set: jungshik@ comments Created 6 years, 7 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « chrome/renderer/spellchecker/spellcheck_worditerator.h ('k') | no next file » | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: chrome/renderer/spellchecker/spellcheck_worditerator.cc
diff --git a/chrome/renderer/spellchecker/spellcheck_worditerator.cc b/chrome/renderer/spellchecker/spellcheck_worditerator.cc
index 1297c5ab8f202afaefa6606f26724257f3e59de2..a84904293ea580f0988f91c1c5669c390794fd7a 100644
--- a/chrome/renderer/spellchecker/spellcheck_worditerator.cc
+++ b/chrome/renderer/spellchecker/spellcheck_worditerator.cc
@@ -10,6 +10,7 @@
#include <string>
#include "base/basictypes.h"
+#include "base/i18n/break_iterator.h"
#include "base/logging.h"
#include "base/strings/stringprintf.h"
#include "base/strings/utf_string_conversions.h"
@@ -299,10 +300,8 @@ bool SpellcheckCharAttribute::OutputDefault(UChar c,
SpellcheckWordIterator::SpellcheckWordIterator()
: text_(NULL),
- length_(0),
- position_(UBRK_DONE),
attribute_(NULL),
- iterator_(NULL) {
+ iterator_() {
}
SpellcheckWordIterator::~SpellcheckWordIterator() {
@@ -315,18 +314,22 @@ bool SpellcheckWordIterator::Initialize(
// Create a custom ICU break iterator with empty text used in this object. (We
// allow setting text later so we can re-use this iterator.)
DCHECK(attribute);
- UErrorCode open_status = U_ZERO_ERROR;
- UParseError parse_status;
- base::string16 rule(attribute->GetRuleSet(allow_contraction));
+ const base::string16 rule(attribute->GetRuleSet(allow_contraction));
// If there is no rule set, the attributes were invalid.
if (rule.empty())
return false;
- iterator_ = ubrk_openRules(rule.c_str(), rule.length(), NULL, 0,
- &parse_status, &open_status);
- if (U_FAILURE(open_status))
+ scoped_ptr<base::i18n::BreakIterator> iterator(
+ new base::i18n::BreakIterator(base::string16(), rule));
+ if (!iterator->Init()) {
+ // Since we're not passing in any text, the only reason this could fail
+ // is if we fail to parse the rules. Since the rules are hardcoded,
+ // that would be a bug in this class.
+ NOTREACHED() << "failed to open iterator (broken rules)";
return false;
+ }
+ iterator_ = iterator.Pass();
// Set the character attributes so we can normalize the words extracted by
// this iterator.
@@ -335,7 +338,7 @@ bool SpellcheckWordIterator::Initialize(
}
bool SpellcheckWordIterator::IsInitialized() const {
- // Return true if we have an ICU custom iterator.
+ // Return true iff we have an iterator.
return !!iterator_;
}
@@ -343,66 +346,51 @@ bool SpellcheckWordIterator::SetText(const base::char16* text, size_t length) {
DCHECK(!!iterator_);
// Set the text to be split by this iterator.
- UErrorCode status = U_ZERO_ERROR;
- ubrk_setText(iterator_, text, length, &status);
- if (U_FAILURE(status))
- return false;
-
- // Retrieve the position to the first word in this text. We return false if
- // this text does not have any words. (For example, The input text consists
- // only of Chinese characters while the spellchecker language is English.)
- position_ = ubrk_first(iterator_);
- if (position_ == UBRK_DONE)
+ if (!iterator_->SetText(text, length)) {
+ LOG(ERROR) << "failed to set text";
return false;
+ }
text_ = text;
- length_ = static_cast<int>(length);
return true;
}
bool SpellcheckWordIterator::GetNextWord(base::string16* word_string,
int* word_start,
int* word_length) {
- DCHECK(!!text_ && length_ > 0);
+ DCHECK(!!text_);
word_string->clear();
*word_start = 0;
*word_length = 0;
- if (!text_ || position_ == UBRK_DONE)
+ if (!text_) {
return false;
+ }
// Find a word that can be checked for spelling. Our rule sets filter out
// invalid words (e.g. numbers and characters not supported by the
// spellchecker language) so iterator_->IsWord() returns false when this
// iterator finds an invalid word. So, we skip such words until we can find a
// valid word or reach the end of the input string.
- int next = ubrk_next(iterator_);
- while (next != UBRK_DONE) {
- if (ubrk_getRuleStatus(iterator_) != UBRK_WORD_NONE) {
- if (Normalize(position_, next - position_, word_string)) {
- *word_start = position_;
- *word_length = next - position_;
- position_ = next;
+ while (iterator_->Advance()) {
+ const size_t start = iterator_->prev();
+ const size_t length = iterator_->pos() - start;
+ if (iterator_->IsWord()) {
+ if (Normalize(start, length, word_string)) {
+ *word_start = start;
+ *word_length = length;
return true;
}
}
- position_ = next;
- next = ubrk_next(iterator_);
}
- // There aren't any more words in the given text. Set the position to
- // UBRK_DONE to prevent from calling ubrk_next() next time when this function
- // is called.
- position_ = UBRK_DONE;
+ // There aren't any more words in the given text.
return false;
}
void SpellcheckWordIterator::Reset() {
- if (iterator_) {
- ubrk_close(iterator_);
- iterator_ = NULL;
- }
+ iterator_.reset();
}
bool SpellcheckWordIterator::Normalize(int input_start,
« no previous file with comments | « chrome/renderer/spellchecker/spellcheck_worditerator.h ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698