| Index: src/extensions/i18n/break-iterator.cc
|
| diff --git a/src/extensions/i18n/break-iterator.cc b/src/extensions/i18n/break-iterator.cc
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..1225360fb73b744edf601a5c2fe3f55ebba12efb
|
| --- /dev/null
|
| +++ b/src/extensions/i18n/break-iterator.cc
|
| @@ -0,0 +1,331 @@
|
| +// Copyright 2013 the V8 project authors. All rights reserved.
|
| +// Redistribution and use in source and binary forms, with or without
|
| +// modification, are permitted provided that the following conditions are
|
| +// met:
|
| +//
|
| +// * Redistributions of source code must retain the above copyright
|
| +// notice, this list of conditions and the following disclaimer.
|
| +// * Redistributions in binary form must reproduce the above
|
| +// copyright notice, this list of conditions and the following
|
| +// disclaimer in the documentation and/or other materials provided
|
| +// with the distribution.
|
| +// * Neither the name of Google Inc. nor the names of its
|
| +// contributors may be used to endorse or promote products derived
|
| +// from this software without specific prior written permission.
|
| +//
|
| +// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
| +// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
| +// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
| +// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
| +// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
| +// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
| +// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
| +// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
| +// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
| +// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
| +// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
| +
|
| +#include "break-iterator.h"
|
| +
|
| +#include <string.h>
|
| +
|
| +#include "i18n-utils.h"
|
| +#include "unicode/brkiter.h"
|
| +#include "unicode/locid.h"
|
| +#include "unicode/rbbi.h"
|
| +
|
| +namespace v8_i18n {
|
| +
|
| +// Forward declarations of the file-local helpers defined later in this file.
|
| +static v8::Handle<v8::Value> ThrowUnexpectedObjectError();
|
| +static icu::UnicodeString* ResetAdoptedText(v8::Handle<v8::Object> obj,
|
| +                                            v8::Handle<v8::Value> value);
|
| +static icu::BreakIterator* InitializeBreakIterator(
|
| +    v8::Handle<v8::String> locale,
|
| +    v8::Handle<v8::Object> options,
|
| +    v8::Handle<v8::Object> resolved);
|
| +static icu::BreakIterator* CreateICUBreakIterator(
|
| +    const icu::Locale& icu_locale,
|
| +    v8::Handle<v8::Object> options);
|
| +static void SetResolvedSettings(const icu::Locale& icu_locale,
|
| +                                icu::BreakIterator* break_iterator,
|
| +                                v8::Handle<v8::Object> resolved);
|
| +
|
| +// Returns the ICU break iterator stored in internal field 0 of |obj|, or NULL
|
| +// when |obj| does not look like a wrapper created by JSCreateBreakIterator.
|
| +icu::BreakIterator* BreakIterator::UnpackBreakIterator(
|
| +    v8::Handle<v8::Object> obj) {
|
| +  v8::HandleScope handle_scope;
|
| +
|
| +  // An empty handle (for example the result of a failed ToObject()
|
| +  // conversion) must not be dereferenced.
|
| +  if (obj.IsEmpty()) return NULL;
|
| +
|
| +  // v8::ObjectTemplate doesn't have HasInstance method so we can't check
|
| +  // if obj is an instance of BreakIterator class. We'll check for a property
|
| +  // that has to be in the object. The same applies to other services, like
|
| +  // Collator and DateTimeFormat.
|
| +  if (!obj->HasOwnProperty(v8::String::New("breakIterator"))) return NULL;
|
| +
|
| +  // Any object can carry a "breakIterator" property, so also make sure the
|
| +  // internal fields this file uses (0: iterator, 1: adopted text) exist
|
| +  // before reading from them.
|
| +  if (obj->InternalFieldCount() < 2) return NULL;
|
| +
|
| +  return static_cast<icu::BreakIterator*>(
|
| +      obj->GetAlignedPointerFromInternalField(0));
|
| +}
|
| +
|
| +// Weak callback for break iterator wrappers: releases the native objects
|
| +// referenced from the wrapper's internal fields and then disposes of the
|
| +// persistent handle itself. |param| is not used.
|
| +void BreakIterator::DeleteBreakIterator(v8::Isolate* isolate,
|
| +                                        v8::Persistent<v8::Object>* object,
|
| +                                        void* param) {
|
| +  v8::HandleScope scope(isolate);
|
| +  v8::Local<v8::Object> wrapper =
|
| +      v8::Local<v8::Object>::New(isolate, *object);
|
| +
|
| +  // Internal field 0: the ICU break iterator. Unpacking only yields NULL if
|
| +  // this callback was registered for a persistent handle that does not point
|
| +  // to a break iterator, which should never happen.
|
| +  icu::BreakIterator* iterator = UnpackBreakIterator(wrapper);
|
| +  delete iterator;
|
| +
|
| +  // Internal field 1: the adopted text.
|
| +  icu::UnicodeString* adopted_text = static_cast<icu::UnicodeString*>(
|
| +      wrapper->GetAlignedPointerFromInternalField(1));
|
| +  delete adopted_text;
|
| +
|
| +  // Finally release the persistent handle to the JS object.
|
| +  object->Dispose(isolate);
|
| +}
|
| +
|
| +// Throws a JavaScript exception.
|
| +static v8::Handle<v8::Value> ThrowUnexpectedObjectError() {
|
| + // Returns undefined, and schedules an exception to be thrown.
|
| + return v8::ThrowException(v8::Exception::Error(
|
| + v8::String::New("BreakIterator method called on an object "
|
| + "that is not a BreakIterator.")));
|
| +}
|
| +
|
| +// Replaces the adopted text kept in internal field 1 of |obj| with a new ICU
|
| +// string built from |value|. The previously stored string is deleted first.
|
| +// Returns the newly stored string; it stays owned by the wrapper object.
|
| +icu::UnicodeString* ResetAdoptedText(
|
| +    v8::Handle<v8::Object> obj, v8::Handle<v8::Value> value) {
|
| +  // Free whatever text was adopted earlier (deleting NULL is a no-op).
|
| +  delete static_cast<icu::UnicodeString*>(
|
| +      obj->GetAlignedPointerFromInternalField(1));
|
| +
|
| +  // Build the replacement from the 16-bit character data of |value|.
|
| +  v8::String::Value utf16(value);
|
| +  const UChar* chars = reinterpret_cast<const UChar*>(*utf16);
|
| +  icu::UnicodeString* adopted = new icu::UnicodeString(chars, utf16.length());
|
| +
|
| +  // Remember the new string on the wrapper and hand it to the caller.
|
| +  obj->SetAlignedPointerInInternalField(1, adopted);
|
| +  return adopted;
|
| +}
|
| +
|
| +// Native implementation of text adoption. Expects exactly two arguments: the
|
| +// break iterator wrapper object and the string the iterator should walk.
|
| +// Throws a JavaScript Error when the arguments are malformed or the object
|
| +// is not a break iterator wrapper.
|
| +void BreakIterator::JSInternalBreakIteratorAdoptText(
|
| +    const v8::FunctionCallbackInfo<v8::Value>& args) {
|
| +  const bool well_formed =
|
| +      args.Length() == 2 && args[0]->IsObject() && args[1]->IsString();
|
| +  if (!well_formed) {
|
| +    v8::ThrowException(v8::Exception::Error(
|
| +        v8::String::New(
|
| +            "Internal error. Iterator and text have to be specified.")));
|
| +    return;
|
| +  }
|
| +
|
| +  icu::BreakIterator* iterator = UnpackBreakIterator(args[0]->ToObject());
|
| +  if (iterator == NULL) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  // Store a fresh copy of the text on the wrapper, then point the iterator
|
| +  // at that copy.
|
| +  icu::UnicodeString* adopted = ResetAdoptedText(args[0]->ToObject(), args[1]);
|
| +  iterator->setText(*adopted);
|
| +}
|
| +
|
| +// Native implementation of the "first" operation. args[0] must be a break
|
| +// iterator wrapper; the return value is the int32 result of
|
| +// icu::BreakIterator::first(). Throws a JavaScript Error otherwise.
|
| +void BreakIterator::JSInternalBreakIteratorFirst(
|
| +    const v8::FunctionCallbackInfo<v8::Value>& args) {
|
| +  // Validate before converting: a missing argument reads as undefined, and
|
| +  // ToObject() cannot convert undefined/null, which would leave us with an
|
| +  // empty handle to dereference.
|
| +  if (args.Length() < 1 || !args[0]->IsObject()) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
|
| +  if (!break_iterator) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  args.GetReturnValue().Set(static_cast<int32_t>(break_iterator->first()));
|
| +}
|
| +
|
| +// Native implementation of the "next" operation. args[0] must be a break
|
| +// iterator wrapper; the return value is the int32 result of
|
| +// icu::BreakIterator::next(). Throws a JavaScript Error otherwise.
|
| +void BreakIterator::JSInternalBreakIteratorNext(
|
| +    const v8::FunctionCallbackInfo<v8::Value>& args) {
|
| +  // Validate before converting: a missing argument reads as undefined, and
|
| +  // ToObject() cannot convert undefined/null, which would leave us with an
|
| +  // empty handle to dereference.
|
| +  if (args.Length() < 1 || !args[0]->IsObject()) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
|
| +  if (!break_iterator) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  args.GetReturnValue().Set(static_cast<int32_t>(break_iterator->next()));
|
| +}
|
| +
|
| +// Native implementation of the "current" operation. args[0] must be a break
|
| +// iterator wrapper; the return value is the int32 result of
|
| +// icu::BreakIterator::current(). Throws a JavaScript Error otherwise.
|
| +void BreakIterator::JSInternalBreakIteratorCurrent(
|
| +    const v8::FunctionCallbackInfo<v8::Value>& args) {
|
| +  // Validate before converting: a missing argument reads as undefined, and
|
| +  // ToObject() cannot convert undefined/null, which would leave us with an
|
| +  // empty handle to dereference.
|
| +  if (args.Length() < 1 || !args[0]->IsObject()) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
|
| +  if (!break_iterator) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  args.GetReturnValue().Set(static_cast<int32_t>(break_iterator->current()));
|
| +}
|
| +
|
| +// Native implementation of the "breakType" operation. args[0] must be a
|
| +// break iterator wrapper. Maps the ICU rule status of the current break to
|
| +// one of the strings "none", "number", "letter", "kana", "ideo" or
|
| +// "unknown" and returns it. Throws a JavaScript Error for any other receiver.
|
| +void BreakIterator::JSInternalBreakIteratorBreakType(
|
| +    const v8::FunctionCallbackInfo<v8::Value>& args) {
|
| +  // Validate before converting: a missing argument reads as undefined, and
|
| +  // ToObject() cannot convert undefined/null, which would leave us with an
|
| +  // empty handle to dereference.
|
| +  if (args.Length() < 1 || !args[0]->IsObject()) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  icu::BreakIterator* break_iterator = UnpackBreakIterator(args[0]->ToObject());
|
| +  if (!break_iterator) {
|
| +    ThrowUnexpectedObjectError();
|
| +    return;
|
| +  }
|
| +
|
| +  // TODO(cira): Remove cast once ICU fixes base BreakIterator class.
|
| +  icu::RuleBasedBreakIterator* rule_based_iterator =
|
| +      static_cast<icu::RuleBasedBreakIterator*>(break_iterator);
|
| +  int32_t status = rule_based_iterator->getRuleStatus();
|
| +  // Keep return values in sync with JavaScript BreakType enum.
|
| +  v8::Handle<v8::String> result;
|
| +  if (status >= UBRK_WORD_NONE && status < UBRK_WORD_NONE_LIMIT) {
|
| +    result = v8::String::New("none");
|
| +  } else if (status >= UBRK_WORD_NUMBER && status < UBRK_WORD_NUMBER_LIMIT) {
|
| +    result = v8::String::New("number");
|
| +  } else if (status >= UBRK_WORD_LETTER && status < UBRK_WORD_LETTER_LIMIT) {
|
| +    result = v8::String::New("letter");
|
| +  } else if (status >= UBRK_WORD_KANA && status < UBRK_WORD_KANA_LIMIT) {
|
| +    result = v8::String::New("kana");
|
| +  } else if (status >= UBRK_WORD_IDEO && status < UBRK_WORD_IDEO_LIMIT) {
|
| +    result = v8::String::New("ideo");
|
| +  } else {
|
| +    result = v8::String::New("unknown");
|
| +  }
|
| +  args.GetReturnValue().Set(result);
|
| +}
|
| +
|
| +// Native implementation behind break iterator construction. Expects three
|
| +// arguments: the locale string, the options object and the object that
|
| +// receives the resolved settings. Wraps a new ICU break iterator in an
|
| +// instance of the template returned by Utils::GetTemplate2 and returns that
|
| +// wrapper. The native objects are released by DeleteBreakIterator, which is
|
| +// registered as the wrapper's weak callback. Throws a JavaScript Error on
|
| +// malformed arguments or when the iterator cannot be created.
|
| +void BreakIterator::JSCreateBreakIterator(
|
| +    const v8::FunctionCallbackInfo<v8::Value>& args) {
|
| +  if (args.Length() != 3 || !args[0]->IsString() || !args[1]->IsObject() ||
|
| +      !args[2]->IsObject()) {
|
| +    v8::ThrowException(v8::Exception::Error(
|
| +        v8::String::New("Internal error, wrong parameters.")));
|
| +    return;
|
| +  }
|
| +
|
| +  v8::Isolate* isolate = args.GetIsolate();
|
| +  v8::Local<v8::ObjectTemplate> break_iterator_template =
|
| +      Utils::GetTemplate2(isolate);
|
| +
|
| +  // Create an empty object wrapper.
|
| +  v8::Local<v8::Object> local_object = break_iterator_template->NewInstance();
|
| +  // But the handle shouldn't be empty.
|
| +  // That can happen if there was a stack overflow when creating the object.
|
| +  if (local_object.IsEmpty()) {
|
| +    args.GetReturnValue().Set(local_object);
|
| +    return;
|
| +  }
|
| +
|
| +  icu::BreakIterator* break_iterator = InitializeBreakIterator(
|
| +      args[0]->ToString(), args[1]->ToObject(), args[2]->ToObject());
|
| +  if (!break_iterator) {
|
| +    v8::ThrowException(v8::Exception::Error(v8::String::New(
|
| +        "Internal error. Couldn't create ICU break iterator.")));
|
| +    return;
|
| +  }
|
| +
|
| +  // Set break iterator as internal field of the resulting JS object.
|
| +  local_object->SetAlignedPointerInInternalField(0, break_iterator);
|
| +  // Make sure that the pointer to adopted text is NULL.
|
| +  local_object->SetAlignedPointerInInternalField(1, NULL);
|
| +
|
| +  // Tag the wrapper with the property UnpackBreakIterator looks for.
|
| +  v8::TryCatch try_catch;
|
| +  local_object->Set(v8::String::New("breakIterator"),
|
| +                    v8::String::New("valid"));
|
| +  if (try_catch.HasCaught()) {
|
| +    // The wrapper has not been made weak yet, so DeleteBreakIterator will
|
| +    // never run for it. Release the iterator here and clear the now stale
|
| +    // pointer so nothing can reach the freed object through the wrapper.
|
| +    local_object->SetAlignedPointerInInternalField(0, NULL);
|
| +    delete break_iterator;
|
| +    v8::ThrowException(v8::Exception::Error(
|
| +        v8::String::New("Internal error, couldn't set property.")));
|
| +    return;
|
| +  }
|
| +
|
| +  v8::Persistent<v8::Object> wrapper(isolate, local_object);
|
| +  // Make object handle weak so we can delete iterator once GC kicks in.
|
| +  wrapper.MakeWeak<void>(NULL, &DeleteBreakIterator);
|
| +  args.GetReturnValue().Set(wrapper);
|
| +  wrapper.ClearAndLeak();
|
| +}
|
| +
|
| +// Creates an ICU break iterator for the BCP47 tag in |locale| using the
|
| +// settings in |options|, and records the locale that was actually used in
|
| +// |resolved|. An empty |locale| selects the default-constructed icu::Locale.
|
| +// If creation fails for the full locale, it is retried with the base name
|
| +// only (extensions removed). Returns NULL when the tag cannot be converted
|
| +// or no iterator could be created; the caller owns the returned iterator.
|
| +static icu::BreakIterator* InitializeBreakIterator(
|
| +    v8::Handle<v8::String> locale,
|
| +    v8::Handle<v8::Object> options,
|
| +    v8::Handle<v8::Object> resolved) {
|
| +  // Convert BCP47 into ICU locale format.
|
| +  UErrorCode status = U_ZERO_ERROR;
|
| +  icu::Locale icu_locale;
|
| +  char icu_result[ULOC_FULLNAME_CAPACITY];
|
| +  // Receives the number of characters of the tag that ICU parsed.
|
| +  int32_t parsed_length = 0;
|
| +  v8::String::AsciiValue bcp47_locale(locale);
|
| +  if (bcp47_locale.length() != 0) {
|
| +    uloc_forLanguageTag(*bcp47_locale, icu_result, ULOC_FULLNAME_CAPACITY,
|
| +                        &parsed_length, &status);
|
| +    // U_STRING_NOT_TERMINATED_WARNING is not a failure for U_FAILURE(), but
|
| +    // it means |icu_result| has no trailing NUL and must not be passed to
|
| +    // the icu::Locale(const char*) constructor.
|
| +    if (U_FAILURE(status) || status == U_STRING_NOT_TERMINATED_WARNING ||
|
| +        parsed_length == 0) {
|
| +      return NULL;
|
| +    }
|
| +    icu_locale = icu::Locale(icu_result);
|
| +  }
|
| +
|
| +  icu::BreakIterator* break_iterator =
|
| +      CreateICUBreakIterator(icu_locale, options);
|
| +  if (break_iterator) {
|
| +    SetResolvedSettings(icu_locale, break_iterator, resolved);
|
| +    return break_iterator;
|
| +  }
|
| +
|
| +  // Remove extensions and try again.
|
| +  icu::Locale no_extension_locale(icu_locale.getBaseName());
|
| +  break_iterator = CreateICUBreakIterator(no_extension_locale, options);
|
| +
|
| +  // Set resolved settings (locale).
|
| +  SetResolvedSettings(no_extension_locale, break_iterator, resolved);
|
| +  return break_iterator;
|
| +}
|
| +
|
| +// Builds an ICU break iterator for |icu_locale| of the kind named by the
|
| +// "type" entry of |options| ("character", "sentence" or "line"; anything
|
| +// else yields a word iterator). Returns NULL when the entry is missing or
|
| +// ICU reports a failure.
|
| +static icu::BreakIterator* CreateICUBreakIterator(
|
| +    const icu::Locale& icu_locale, v8::Handle<v8::Object> options) {
|
| +  icu::UnicodeString kind;
|
| +  if (!Utils::ExtractStringSetting(options, "type", &kind)) {
|
| +    // Type had to be in the options. This would be an internal error.
|
| +    return NULL;
|
| +  }
|
| +
|
| +  UErrorCode status = U_ZERO_ERROR;
|
| +  icu::BreakIterator* iterator = NULL;
|
| +  if (kind == UNICODE_STRING_SIMPLE("character")) {
|
| +    iterator = icu::BreakIterator::createCharacterInstance(icu_locale, status);
|
| +  } else if (kind == UNICODE_STRING_SIMPLE("sentence")) {
|
| +    iterator = icu::BreakIterator::createSentenceInstance(icu_locale, status);
|
| +  } else if (kind == UNICODE_STRING_SIMPLE("line")) {
|
| +    iterator = icu::BreakIterator::createLineInstance(icu_locale, status);
|
| +  } else {
|
| +    // Default is word iterator.
|
| +    iterator = icu::BreakIterator::createWordInstance(icu_locale, status);
|
| +  }
|
| +
|
| +  if (U_SUCCESS(status)) return iterator;
|
| +
|
| +  // Creation failed: discard whatever ICU may have handed back.
|
| +  delete iterator;
|
| +  return NULL;
|
| +}
|
| +
|
| +// Writes the locale that was actually used, as a BCP47 language tag, into
|
| +// the "locale" property of |resolved|. Falls back to "und" when ICU cannot
|
| +// produce a usable tag. |break_iterator| is currently not consulted.
|
| +static void SetResolvedSettings(const icu::Locale& icu_locale,
|
| +                                icu::BreakIterator* break_iterator,
|
| +                                v8::Handle<v8::Object> resolved) {
|
| +  UErrorCode status = U_ZERO_ERROR;
|
| +  char result[ULOC_FULLNAME_CAPACITY];
|
| +  uloc_toLanguageTag(
|
| +      icu_locale.getName(), result, ULOC_FULLNAME_CAPACITY, FALSE, &status);
|
| +
|
| +  // U_STRING_NOT_TERMINATED_WARNING counts as success for U_SUCCESS(), but
|
| +  // it means |result| has no trailing NUL and must not be read as a C string.
|
| +  const bool usable =
|
| +      U_SUCCESS(status) && status != U_STRING_NOT_TERMINATED_WARNING;
|
| +
|
| +  // Failure is not expected here, since the locale came from ICU itself.
|
| +  resolved->Set(v8::String::New("locale"),
|
| +                v8::String::New(usable ? result : "und"));
|
| +}
|
| +
|
| +} // namespace v8_i18n
|
|
|