Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(33)

Unified Diff: src/extensions/i18n/break-iterator.cc

Issue 18487004: Import the v8-i18n extension into v8 (Closed) Base URL: https://v8.googlecode.com/svn/branches/bleeding_edge
Patch Set: Created 7 years, 6 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
Index: src/extensions/i18n/break-iterator.cc
diff --git a/src/extensions/i18n/break-iterator.cc b/src/extensions/i18n/break-iterator.cc
new file mode 100644
index 0000000000000000000000000000000000000000..1225360fb73b744edf601a5c2fe3f55ebba12efb
--- /dev/null
+++ b/src/extensions/i18n/break-iterator.cc
@@ -0,0 +1,331 @@
+// Copyright 2013 the V8 project authors. All rights reserved.
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are
+// met:
+//
+// * Redistributions of source code must retain the above copyright
+// notice, this list of conditions and the following disclaimer.
+// * Redistributions in binary form must reproduce the above
+// copyright notice, this list of conditions and the following
+// disclaimer in the documentation and/or other materials provided
+// with the distribution.
+// * Neither the name of Google Inc. nor the names of its
+// contributors may be used to endorse or promote products derived
+// from this software without specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+#include "break-iterator.h"
+
+#include <string.h>
+
+#include "i18n-utils.h"
+#include "unicode/brkiter.h"
+#include "unicode/locid.h"
+#include "unicode/rbbi.h"
+
+namespace v8_i18n {
+
+// Forward declarations of the file-local helpers defined further down.
+static v8::Handle<v8::Value> ThrowUnexpectedObjectError();
+static icu::UnicodeString* ResetAdoptedText(v8::Handle<v8::Object> obj,
+                                            v8::Handle<v8::Value> value);
+static icu::BreakIterator* InitializeBreakIterator(
+    v8::Handle<v8::String> locale,
+    v8::Handle<v8::Object> options,
+    v8::Handle<v8::Object> resolved);
+static icu::BreakIterator* CreateICUBreakIterator(
+    const icu::Locale& icu_locale,
+    v8::Handle<v8::Object> options);
+static void SetResolvedSettings(const icu::Locale& icu_locale,
+                                icu::BreakIterator* break_iterator,
+                                v8::Handle<v8::Object> resolved);
+
+// Returns the ICU break iterator stored in internal field 0 of |obj|, or
+// NULL when |obj| does not carry an own "breakIterator" property.
+icu::BreakIterator* BreakIterator::UnpackBreakIterator(
+    v8::Handle<v8::Object> obj) {
+  v8::HandleScope handle_scope;
+
+  // v8::ObjectTemplate has no HasInstance method, so there is no direct way
+  // to ask whether obj was created from the BreakIterator template. Instead
+  // we look for a marker property that every such object must own. Collator
+  // and DateTimeFormat use the same approach.
+  v8::Handle<v8::String> marker = v8::String::New("breakIterator");
+  if (!obj->HasOwnProperty(marker)) {
+    return NULL;
+  }
+
+  void* raw_iterator = obj->GetAlignedPointerFromInternalField(0);
+  return static_cast<icu::BreakIterator*>(raw_iterator);
+}
+
+// Weak-handle callback: frees the C++ objects hanging off the JS wrapper
+// (the iterator in internal field 0 and the adopted text in internal
+// field 1) and then disposes of the persistent handle itself.
+void BreakIterator::DeleteBreakIterator(v8::Isolate* isolate,
+                                        v8::Persistent<v8::Object>* object,
+                                        void* param) {
+  v8::HandleScope handle_scope(isolate);
+  v8::Local<v8::Object> wrapper =
+      v8::Local<v8::Object>::New(isolate, *object);
+
+  // Release the hidden break iterator. Unpacking only yields NULL if this
+  // callback was registered for a persistent handle that does not point to
+  // a break iterator, which should never happen.
+  icu::BreakIterator* iterator = UnpackBreakIterator(wrapper);
+  delete iterator;
+
+  // Release the adopted text, if any.
+  void* adopted_text = wrapper->GetAlignedPointerFromInternalField(1);
+  delete static_cast<icu::UnicodeString*>(adopted_text);
+
+  // Finally drop the persistent handle to the JS object.
+  object->Dispose(isolate);
+}
+
+// Throws a JavaScript exception.
+static v8::Handle<v8::Value> ThrowUnexpectedObjectError() {
+ // Returns undefined, and schedules an exception to be thrown.
+ return v8::ThrowException(v8::Exception::Error(
+ v8::String::New("BreakIterator method called on an object "
+ "that is not a BreakIterator.")));
+}
+
+// Replaces the text adopted by the JavaScript object |obj|.
+//
+// The previously adopted icu::UnicodeString (internal field 1, may be NULL)
+// is deleted, a new one is built from the UTF-16 contents of |value| and
+// stored back into internal field 1.
+//
+// Returns the newly allocated string; ownership stays with |obj|.
+//
+// Declared static to match the forward declaration and the other
+// file-local helpers.
+static icu::UnicodeString* ResetAdoptedText(
+    v8::Handle<v8::Object> obj, v8::Handle<v8::Value> value) {
+  // Get the previous value from the internal field and release it.
+  icu::UnicodeString* text = static_cast<icu::UnicodeString*>(
+      obj->GetAlignedPointerFromInternalField(1));
+  delete text;
+
+  // Copy the new value into a fresh UnicodeString and remember it in the
+  // internal field so that it can be freed later.
+  v8::String::Value text_value(value);
+  text = new icu::UnicodeString(
+      reinterpret_cast<const UChar*>(*text_value), text_value.length());
+  obj->SetAlignedPointerInInternalField(1, text);
+
+  // Return new unicode string pointer.
+  return text;
+}
+
+// JS callback taking (iterator, text): makes the break iterator wrapped by
+// the first argument iterate over the string given as second argument.
+// Throws a JavaScript Error on wrong arguments or a non-BreakIterator object.
+void BreakIterator::JSInternalBreakIteratorAdoptText(
+    const v8::FunctionCallbackInfo<v8::Value>& args) {
+  const bool valid_arguments =
+      args.Length() == 2 && args[0]->IsObject() && args[1]->IsString();
+  if (!valid_arguments) {
+    v8::ThrowException(v8::Exception::Error(
+        v8::String::New(
+            "Internal error. Iterator and text have to be specified.")));
+    return;
+  }
+
+  v8::Local<v8::Object> holder = args[0]->ToObject();
+  icu::BreakIterator* break_iterator = UnpackBreakIterator(holder);
+  if (!break_iterator) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  // The holder keeps ownership of the text; the iterator only refers to it.
+  icu::UnicodeString* adopted_text = ResetAdoptedText(holder, args[1]);
+  break_iterator->setText(*adopted_text);
+}
+
+// JS callback taking (iterator): calls first() on the wrapped ICU break
+// iterator and returns the result as an int32.
+// Throws a JavaScript Error if the first argument is missing, is not an
+// object, or does not wrap a break iterator.
+void BreakIterator::JSInternalBreakIteratorFirst(
+    const v8::FunctionCallbackInfo<v8::Value>& args) {
+  // Validate before converting: UnpackBreakIterator dereferences the handle
+  // it is given, so it must only ever receive a real object.
+  if (args.Length() < 1 || !args[0]->IsObject()) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
+  if (!break_iterator) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  args.GetReturnValue().Set(static_cast<int32_t>(break_iterator->first()));
+}
+
+// JS callback taking (iterator): calls next() on the wrapped ICU break
+// iterator and returns the result as an int32.
+// Throws a JavaScript Error if the first argument is missing, is not an
+// object, or does not wrap a break iterator.
+void BreakIterator::JSInternalBreakIteratorNext(
+    const v8::FunctionCallbackInfo<v8::Value>& args) {
+  // Validate before converting: UnpackBreakIterator dereferences the handle
+  // it is given, so it must only ever receive a real object.
+  if (args.Length() < 1 || !args[0]->IsObject()) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
+  if (!break_iterator) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  args.GetReturnValue().Set(static_cast<int32_t>(break_iterator->next()));
+}
+
+// JS callback taking (iterator): calls current() on the wrapped ICU break
+// iterator and returns the result as an int32.
+// Throws a JavaScript Error if the first argument is missing, is not an
+// object, or does not wrap a break iterator.
+void BreakIterator::JSInternalBreakIteratorCurrent(
+    const v8::FunctionCallbackInfo<v8::Value>& args) {
+  // Validate before converting: UnpackBreakIterator dereferences the handle
+  // it is given, so it must only ever receive a real object.
+  if (args.Length() < 1 || !args[0]->IsObject()) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
+  if (!break_iterator) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  args.GetReturnValue().Set(static_cast<int32_t>(break_iterator->current()));
+}
+
+// JS callback taking (iterator): maps the rule status of the wrapped ICU
+// break iterator onto one of the strings "none", "number", "letter",
+// "kana", "ideo" or "unknown" and returns it.
+// Throws a JavaScript Error if the first argument is missing, is not an
+// object, or does not wrap a break iterator.
+void BreakIterator::JSInternalBreakIteratorBreakType(
+    const v8::FunctionCallbackInfo<v8::Value>& args) {
+  // Validate before converting: UnpackBreakIterator dereferences the handle
+  // it is given, so it must only ever receive a real object.
+  if (args.Length() < 1 || !args[0]->IsObject()) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
+  if (!break_iterator) {
+    ThrowUnexpectedObjectError();
+    return;
+  }
+
+  // TODO(cira): Remove cast once ICU fixes base BreakIterator class.
+  icu::RuleBasedBreakIterator* rule_based_iterator =
+      static_cast<icu::RuleBasedBreakIterator*>(break_iterator);
+  int32_t status = rule_based_iterator->getRuleStatus();
+  // Keep return values in sync with JavaScript BreakType enum.
+  v8::Handle<v8::String> result;
+  if (status >= UBRK_WORD_NONE && status < UBRK_WORD_NONE_LIMIT) {
+    result = v8::String::New("none");
+  } else if (status >= UBRK_WORD_NUMBER && status < UBRK_WORD_NUMBER_LIMIT) {
+    result = v8::String::New("number");
+  } else if (status >= UBRK_WORD_LETTER && status < UBRK_WORD_LETTER_LIMIT) {
+    result = v8::String::New("letter");
+  } else if (status >= UBRK_WORD_KANA && status < UBRK_WORD_KANA_LIMIT) {
+    result = v8::String::New("kana");
+  } else if (status >= UBRK_WORD_IDEO && status < UBRK_WORD_IDEO_LIMIT) {
+    result = v8::String::New("ideo");
+  } else {
+    result = v8::String::New("unknown");
+  }
+  args.GetReturnValue().Set(result);
+}
+
+// JS callback taking (locale, options, resolved): creates a JS wrapper
+// object around a new ICU break iterator and returns it.
+//
+// The iterator lives in internal field 0 of the wrapper, the adopted text
+// (initially NULL) in internal field 1. The wrapper is held through a weak
+// persistent handle so that DeleteBreakIterator can free both later.
+//
+// Throws a JavaScript Error on wrong arguments, when ICU cannot create the
+// iterator, or when the marker property cannot be set on the wrapper.
+void BreakIterator::JSCreateBreakIterator(
+    const v8::FunctionCallbackInfo<v8::Value>& args) {
+  if (args.Length() != 3 || !args[0]->IsString() || !args[1]->IsObject() ||
+      !args[2]->IsObject()) {
+    v8::ThrowException(v8::Exception::Error(
+        v8::String::New("Internal error, wrong parameters.")));
+    return;
+  }
+
+  v8::Isolate* isolate = args.GetIsolate();
+  v8::Local<v8::ObjectTemplate> break_iterator_template =
+      Utils::GetTemplate2(isolate);
+
+  // Create an empty object wrapper.
+  v8::Local<v8::Object> local_object = break_iterator_template->NewInstance();
+  // But the handle shouldn't be empty.
+  // That can happen if there was a stack overflow when creating the object.
+  if (local_object.IsEmpty()) {
+    args.GetReturnValue().Set(local_object);
+    return;
+  }
+
+  // Set break iterator as internal field of the resulting JS object.
+  icu::BreakIterator* break_iterator = InitializeBreakIterator(
+      args[0]->ToString(), args[1]->ToObject(), args[2]->ToObject());
+
+  if (!break_iterator) {
+    v8::ThrowException(v8::Exception::Error(v8::String::New(
+        "Internal error. Couldn't create ICU break iterator.")));
+    return;
+  }
+
+  local_object->SetAlignedPointerInInternalField(0, break_iterator);
+  // Make sure that the pointer to adopted text is NULL.
+  local_object->SetAlignedPointerInInternalField(1, NULL);
+
+  {
+    v8::TryCatch try_catch;
+    local_object->Set(v8::String::New("breakIterator"),
+                      v8::String::New("valid"));
+    if (try_catch.HasCaught()) {
+      // The wrapper has not been made weak yet, so DeleteBreakIterator will
+      // never run for it. Free the iterator here instead of leaking it, and
+      // clear the field so that it does not keep a dangling pointer.
+      local_object->SetAlignedPointerInInternalField(0, NULL);
+      delete break_iterator;
+      v8::ThrowException(v8::Exception::Error(
+          v8::String::New("Internal error, couldn't set property.")));
+      return;
+    }
+  }
+
+  v8::Persistent<v8::Object> wrapper(isolate, local_object);
+  // Make object handle weak so we can delete iterator once GC kicks in.
+  wrapper.MakeWeak<void>(NULL, &DeleteBreakIterator);
+  args.GetReturnValue().Set(wrapper);
+  wrapper.ClearAndLeak();
+}
+
+// Creates an ICU break iterator for the BCP47 tag |locale| using the
+// settings in |options|, and records the locale that was actually used in
+// |resolved|.
+//
+// An empty |locale| leaves the default-constructed icu::Locale in place. If
+// creation fails for the full locale, it is retried with the locale's base
+// name (extensions removed).
+//
+// Returns the new iterator (owned by the caller), or NULL if the tag cannot
+// be converted or no iterator could be created.
+static icu::BreakIterator* InitializeBreakIterator(
+    v8::Handle<v8::String> locale,
+    v8::Handle<v8::Object> options,
+    v8::Handle<v8::Object> resolved) {
+  // Convert BCP47 into ICU locale format.
+  UErrorCode status = U_ZERO_ERROR;
+  icu::Locale icu_locale;
+  char icu_result[ULOC_FULLNAME_CAPACITY];
+  // Receives the number of characters of the tag that ICU parsed.
+  int32_t parsed_length = 0;
+  v8::String::AsciiValue bcp47_locale(locale);
+  if (bcp47_locale.length() != 0) {
+    uloc_forLanguageTag(*bcp47_locale, icu_result, ULOC_FULLNAME_CAPACITY,
+                        &parsed_length, &status);
+    // U_STRING_NOT_TERMINATED_WARNING is not a failure as far as U_FAILURE
+    // is concerned, but it means icu_result has no terminating NUL and must
+    // not be handed to icu::Locale as a C string.
+    if (U_FAILURE(status) || status == U_STRING_NOT_TERMINATED_WARNING ||
+        parsed_length == 0) {
+      return NULL;
+    }
+    icu_locale = icu::Locale(icu_result);
+  }
+
+  icu::BreakIterator* break_iterator =
+      CreateICUBreakIterator(icu_locale, options);
+  if (!break_iterator) {
+    // Remove extensions and try again.
+    icu::Locale no_extension_locale(icu_locale.getBaseName());
+    break_iterator = CreateICUBreakIterator(no_extension_locale, options);
+
+    // Set resolved settings (locale).
+    SetResolvedSettings(no_extension_locale, break_iterator, resolved);
+  } else {
+    SetResolvedSettings(icu_locale, break_iterator, resolved);
+  }
+
+  return break_iterator;
+}
+
+// Builds the ICU break iterator selected by the "type" entry of |options|
+// ("character", "sentence" or "line"; anything else yields a word iterator)
+// for |icu_locale|.
+//
+// Returns NULL when "type" is missing from |options| or ICU reports a
+// failure; otherwise the caller owns the returned iterator.
+static icu::BreakIterator* CreateICUBreakIterator(
+    const icu::Locale& icu_locale, v8::Handle<v8::Object> options) {
+  icu::UnicodeString type_name;
+  if (!Utils::ExtractStringSetting(options, "type", &type_name)) {
+    // The caller must always supply a type; its absence is an internal error.
+    return NULL;
+  }
+
+  UErrorCode status = U_ZERO_ERROR;
+  icu::BreakIterator* iterator = NULL;
+  if (type_name == UNICODE_STRING_SIMPLE("character")) {
+    iterator = icu::BreakIterator::createCharacterInstance(icu_locale, status);
+  } else if (type_name == UNICODE_STRING_SIMPLE("sentence")) {
+    iterator = icu::BreakIterator::createSentenceInstance(icu_locale, status);
+  } else if (type_name == UNICODE_STRING_SIMPLE("line")) {
+    iterator = icu::BreakIterator::createLineInstance(icu_locale, status);
+  } else {
+    // Default is word iterator.
+    iterator = icu::BreakIterator::createWordInstance(icu_locale, status);
+  }
+
+  if (U_FAILURE(status)) {
+    // Discard whatever ICU may have handed back alongside the error.
+    delete iterator;
+    return NULL;
+  }
+
+  return iterator;
+}
+
+// Stores the BCP47 language tag of |icu_locale| under the "locale" key of
+// |resolved|, falling back to "und" when the tag cannot be produced.
+//
+// |break_iterator| is currently unused.
+static void SetResolvedSettings(const icu::Locale& icu_locale,
+                                icu::BreakIterator* break_iterator,
+                                v8::Handle<v8::Object> resolved) {
+  // Set the locale
+  UErrorCode status = U_ZERO_ERROR;
+  char result[ULOC_FULLNAME_CAPACITY];
+  uloc_toLanguageTag(
+      icu_locale.getName(), result, ULOC_FULLNAME_CAPACITY, FALSE, &status);
+  // U_STRING_NOT_TERMINATED_WARNING counts as success for U_SUCCESS, but in
+  // that case result has no terminating NUL and cannot be read as a C string.
+  if (U_SUCCESS(status) && status != U_STRING_NOT_TERMINATED_WARNING) {
+    resolved->Set(v8::String::New("locale"), v8::String::New(result));
+  } else {
+    // Not expected in practice, since we got the locale from ICU.
+    resolved->Set(v8::String::New("locale"), v8::String::New("und"));
+  }
+}
+
+} // namespace v8_i18n

Powered by Google App Engine
This is Rietveld 408576698