Index: src/extensions/i18n/collator.cc |
diff --git a/src/extensions/i18n/collator.cc b/src/extensions/i18n/collator.cc |
new file mode 100644 |
index 0000000000000000000000000000000000000000..4ffa4145fb7dea76cda6787d05707e4f436f44e5 |
--- /dev/null |
+++ b/src/extensions/i18n/collator.cc |
@@ -0,0 +1,363 @@ |
+// Copyright 2013 the V8 project authors. All rights reserved. |
+// Redistribution and use in source and binary forms, with or without |
+// modification, are permitted provided that the following conditions are |
+// met: |
+// |
+// * Redistributions of source code must retain the above copyright |
+// notice, this list of conditions and the following disclaimer. |
+// * Redistributions in binary form must reproduce the above |
+// copyright notice, this list of conditions and the following |
+// disclaimer in the documentation and/or other materials provided |
+// with the distribution. |
+// * Neither the name of Google Inc. nor the names of its |
+// contributors may be used to endorse or promote products derived |
+// from this software without specific prior written permission. |
+// |
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
+// limitations under the License. |
+ |
+#include "collator.h" |
+ |
+#include "i18n-utils.h" |
+#include "unicode/coll.h" |
+#include "unicode/locid.h" |
+#include "unicode/ucol.h" |
+ |
+namespace v8_i18n { |
+ |
+// Forward declarations of the file-local helpers defined further down. |
+ |
+// Creates the ICU collator for a BCP47 locale and fills in |resolved|. |
+static icu::Collator* InitializeCollator(v8::Handle<v8::String> locale, |
+                                         v8::Handle<v8::Object> options, |
+                                         v8::Handle<v8::Object> resolved); |
+ |
+// Creates an ICU collator for |icu_locale| and applies |options| to it. |
+static icu::Collator* CreateICUCollator(const icu::Locale& icu_locale, |
+                                        v8::Handle<v8::Object> options); |
+ |
+// Copies the boolean option |name| from |options| onto |collator|. |
+static bool SetBooleanAttribute(UColAttribute attribute, |
+                                const char* name, |
+                                v8::Handle<v8::Object> options, |
+                                icu::Collator* collator); |
+ |
+// Writes the settings in effect on |collator| to the |resolved| object. |
+static void SetResolvedSettings(const icu::Locale& icu_locale, |
+                                icu::Collator* collator, |
+                                v8::Handle<v8::Object> resolved); |
+ |
+// Writes the on/off state of |attribute| to |resolved| under |property|. |
+static void SetBooleanSetting(UColAttribute attribute, |
+                              icu::Collator* collator, |
+                              const char* property, |
+                              v8::Handle<v8::Object> resolved); |
+ |
+// Returns the ICU collator stored in internal field 0 of |obj|, or NULL if |
+// |obj| does not look like a collator wrapper. |
+// |
+// An object is treated as a wrapper when it owns a "collator" property (the |
+// marker set by JSCreateCollator) and has at least one internal field. The |
+// field-count check keeps us from reading an internal field that does not |
+// exist when script code puts a "collator" property on an ordinary object. |
+// NOTE(review): an object with internal fields that is not a collator but |
+// carries a script-added "collator" property would still pass this check. |
+icu::Collator* Collator::UnpackCollator(v8::Handle<v8::Object> obj) { |
+  v8::HandleScope handle_scope; |
+ |
+  if (obj->InternalFieldCount() < 1 || |
+      !obj->HasOwnProperty(v8::String::New("collator"))) { |
+    return NULL; |
+  } |
+ |
+  return static_cast<icu::Collator*>( |
+      obj->GetAlignedPointerFromInternalField(0)); |
+} |
+ |
+// Weak callback for the persistent handle of a collator wrapper: frees the |
+// ICU collator held by the wrapper, then disposes of the handle itself. |
+// |param| is not used. |
+void Collator::DeleteCollator(v8::Isolate* isolate, |
+                              v8::Persistent<v8::Object>* object, |
+                              void* param) { |
+  v8::HandleScope handle_scope(isolate); |
+ |
+  // Free the hidden C++ object first. UnpackCollator only returns NULL when |
+  // this callback was attached to a persistent handle that does not point |
+  // to a collator, and deleting NULL does nothing. |
+  v8::Local<v8::Object> wrapper = |
+      v8::Local<v8::Object>::New(isolate, *object); |
+  icu::Collator* collator = UnpackCollator(wrapper); |
+  delete collator; |
+ |
+  // Now release the persistent handle to the JS object. |
+  object->Dispose(isolate); |
+} |
+ |
+// Throws a JavaScript exception. |
+static v8::Handle<v8::Value> ThrowUnexpectedObjectError() { |
+ // Returns undefined, and schedules an exception to be thrown. |
+ return v8::ThrowException(v8::Exception::Error( |
+ v8::String::New("Collator method called on an object " |
+ "that is not a Collator."))); |
+} |
+ |
+// When there's an ICU error, throw a JavaScript error with |message|. |
+static v8::Handle<v8::Value> ThrowExceptionForICUError(const char* message) { |
+ return v8::ThrowException(v8::Exception::Error(v8::String::New(message))); |
+} |
+ |
+// static |
+// JS binding that compares two strings with a collator. It expects exactly |
+// three arguments: the collator wrapper object followed by the two strings. |
+// The ICU comparison result becomes the return value. A JavaScript exception |
+// is thrown for bad arguments, for an object that is not a collator, and for |
+// an ICU failure. |
+void Collator::JSInternalCompare( |
+    const v8::FunctionCallbackInfo<v8::Value>& args) { |
+  const bool has_valid_arguments = args.Length() == 3 && |
+                                   args[0]->IsObject() && |
+                                   args[1]->IsString() && |
+                                   args[2]->IsString(); |
+  if (!has_valid_arguments) { |
+    v8::ThrowException(v8::Exception::SyntaxError( |
+        v8::String::New("Collator and two string arguments are required."))); |
+    return; |
+  } |
+ |
+  icu::Collator* collator = UnpackCollator(args[0]->ToObject()); |
+  if (collator == NULL) { |
+    ThrowUnexpectedObjectError(); |
+    return; |
+  } |
+ |
+  // The String::Value objects own the character buffers handed to ICU, so |
+  // they have to stay alive until compare() has returned. |
+  v8::String::Value left(args[1]); |
+  v8::String::Value right(args[2]); |
+ |
+  UErrorCode status = U_ZERO_ERROR; |
+  UCollationResult result = collator->compare( |
+      reinterpret_cast<const UChar*>(*left), left.length(), |
+      reinterpret_cast<const UChar*>(*right), right.length(), |
+      status); |
+  if (U_FAILURE(status)) { |
+    ThrowExceptionForICUError( |
+        "Internal error. Unexpected failure in Collator.compare."); |
+    return; |
+  } |
+ |
+  args.GetReturnValue().Set(result); |
+} |
+ |
+// JS binding that creates a collator wrapper object. |
+// |
+// Expects three arguments: the locale (string), the options object and the |
+// object that receives the resolved settings. On success the return value |
+// is a new object created from the i18n template that holds the ICU |
+// collator in internal field 0 and carries a "collator" marker property; |
+// the handle is made weak with DeleteCollator as its callback, which frees |
+// the ICU collator. On failure a JavaScript exception is thrown. |
+void Collator::JSCreateCollator( |
+    const v8::FunctionCallbackInfo<v8::Value>& args) { |
+  if (args.Length() != 3 || !args[0]->IsString() || !args[1]->IsObject() || |
+      !args[2]->IsObject()) { |
+    v8::ThrowException(v8::Exception::SyntaxError( |
+        v8::String::New("Internal error, wrong parameters."))); |
+    return; |
+  } |
+ |
+  v8::Isolate* isolate = args.GetIsolate(); |
+  v8::Local<v8::ObjectTemplate> intl_collator_template = |
+      Utils::GetTemplate(isolate); |
+ |
+  // Create an empty object wrapper. |
+  v8::Local<v8::Object> local_object = intl_collator_template->NewInstance(); |
+  // But the handle shouldn't be empty. |
+  // That can happen if there was a stack overflow when creating the object. |
+  if (local_object.IsEmpty()) { |
+    args.GetReturnValue().Set(local_object); |
+    return; |
+  } |
+ |
+  icu::Collator* collator = InitializeCollator( |
+      args[0]->ToString(), args[1]->ToObject(), args[2]->ToObject()); |
+  if (!collator) { |
+    v8::ThrowException(v8::Exception::Error(v8::String::New( |
+        "Internal error. Couldn't create ICU collator."))); |
+    return; |
+  } |
+ |
+  // Set collator as internal field of the resulting JS object. |
+  local_object->SetAlignedPointerInInternalField(0, collator); |
+ |
+  // Make it safer to unpack later on. The TryCatch lives in its own block so |
+  // that the replacement error below is thrown after it has gone away. |
+  bool marker_set = false; |
+  { |
+    v8::TryCatch try_catch; |
+    local_object->Set(v8::String::New("collator"), v8::String::New("valid")); |
+    marker_set = !try_catch.HasCaught(); |
+  } |
+  if (!marker_set) { |
+    // No weak handle has been registered yet, so nothing else would free |
+    // the collator. Release it here and clear the internal field so the |
+    // wrapper does not keep a dangling pointer. |
+    local_object->SetAlignedPointerInInternalField(0, NULL); |
+    delete collator; |
+    v8::ThrowException(v8::Exception::Error( |
+        v8::String::New("Internal error, couldn't set property."))); |
+    return; |
+  } |
+ |
+  v8::Persistent<v8::Object> wrapper(isolate, local_object); |
+  // Make object handle weak so we can delete the collator once GC kicks in. |
+  wrapper.MakeWeak<void>(NULL, &DeleteCollator); |
+  args.GetReturnValue().Set(wrapper); |
+  wrapper.ClearAndLeak(); |
+} |
+ |
+// Creates an ICU collator for the BCP47 tag |locale|, configured from |
+// |options|, and records the settings actually in effect on |resolved|. |
+// |
+// An empty |locale| leaves the default-constructed icu::Locale in place. If |
+// no collator can be created for the full locale, a second attempt is made |
+// with the locale's base name only. |
+// |
+// Returns the new collator, or NULL if the tag can't be converted or both |
+// creation attempts fail. |resolved| is only written when a collator was |
+// created. |
+static icu::Collator* InitializeCollator(v8::Handle<v8::String> locale, |
+                                         v8::Handle<v8::Object> options, |
+                                         v8::Handle<v8::Object> resolved) { |
+  // Convert BCP47 into ICU locale format. |
+  UErrorCode status = U_ZERO_ERROR; |
+  icu::Locale icu_locale; |
+  char icu_result[ULOC_FULLNAME_CAPACITY]; |
+  int icu_length = 0; |
+  v8::String::AsciiValue bcp47_locale(locale); |
+  if (bcp47_locale.length() != 0) { |
+    uloc_forLanguageTag(*bcp47_locale, icu_result, ULOC_FULLNAME_CAPACITY, |
+                        &icu_length, &status); |
+    // U_STRING_NOT_TERMINATED_WARNING is not a failure code, but it means |
+    // |icu_result| has no terminating NUL and can't be used as a C string. |
+    if (U_FAILURE(status) || status == U_STRING_NOT_TERMINATED_WARNING || |
+        icu_length == 0) { |
+      return NULL; |
+    } |
+    icu_locale = icu::Locale(icu_result); |
+  } |
+ |
+  icu::Collator* collator = CreateICUCollator(icu_locale, options); |
+  if (collator) { |
+    SetResolvedSettings(icu_locale, collator, resolved); |
+    return collator; |
+  } |
+ |
+  // Remove extensions and try again. |
+  icu::Locale no_extension_locale(icu_locale.getBaseName()); |
+  collator = CreateICUCollator(no_extension_locale, options); |
+  if (!collator) { |
+    // Both attempts failed. SetResolvedSettings dereferences the collator, |
+    // so it must not be called; the caller reports the error. |
+    return NULL; |
+  } |
+ |
+  // Report the settings of the collator that was actually created. |
+  SetResolvedSettings(no_extension_locale, collator, resolved); |
+  return collator; |
+} |
+ |
+// Creates an ICU collator for |icu_locale| and applies the settings read |
+// from |options|: "numeric", "caseFirst", "sensitivity" and |
+// "ignorePunctuation". Normalization is always switched on. |
+// |
+// Returns NULL if ICU fails to create the collator. Errors reported while |
+// applying the individual settings are not checked. |
+static icu::Collator* CreateICUCollator( |
+    const icu::Locale& icu_locale, v8::Handle<v8::Object> options) { |
+  UErrorCode status = U_ZERO_ERROR; |
+  icu::Collator* collator = icu::Collator::createInstance(icu_locale, status); |
+  if (U_FAILURE(status)) { |
+    delete collator; |
+    return NULL; |
+  } |
+ |
+  // Flags go first; sensitivity may override them further down. |
+  SetBooleanAttribute(UCOL_NUMERIC_COLLATION, "numeric", options, collator); |
+ |
+  // The spec requires normalization to be on at all times. Skipping it for |
+  // already-normalized strings would be a valid optimization, but we have |
+  // no way to detect that right now. |
+  collator->setAttribute(UCOL_NORMALIZATION_MODE, UCOL_ON, status); |
+ |
+  icu::UnicodeString case_first; |
+  if (Utils::ExtractStringSetting(options, "caseFirst", &case_first)) { |
+    // Anything other than "upper" or "lower" selects the default |
+    // (false/off). |
+    UColAttributeValue case_first_value = UCOL_OFF; |
+    if (case_first == UNICODE_STRING_SIMPLE("upper")) { |
+      case_first_value = UCOL_UPPER_FIRST; |
+    } else if (case_first == UNICODE_STRING_SIMPLE("lower")) { |
+      case_first_value = UCOL_LOWER_FIRST; |
+    } |
+    collator->setAttribute(UCOL_CASE_FIRST, case_first_value, status); |
+  } |
+ |
+  icu::UnicodeString sensitivity; |
+  if (Utils::ExtractStringSetting(options, "sensitivity", &sensitivity)) { |
+    const bool is_base = sensitivity == UNICODE_STRING_SIMPLE("base"); |
+    if (is_base) { |
+      collator->setStrength(icu::Collator::PRIMARY); |
+    } else if (sensitivity == UNICODE_STRING_SIMPLE("accent")) { |
+      collator->setStrength(icu::Collator::SECONDARY); |
+    } else if (sensitivity == UNICODE_STRING_SIMPLE("case")) { |
+      // "case" is primary strength with the case level switched on. |
+      collator->setStrength(icu::Collator::PRIMARY); |
+      collator->setAttribute(UCOL_CASE_LEVEL, UCOL_ON, status); |
+    } else { |
+      // variant (default) |
+      collator->setStrength(icu::Collator::TERTIARY); |
+    } |
+  } |
+ |
+  // Only an explicit "ignorePunctuation: true" changes alternate handling. |
+  bool ignore_punctuation = false; |
+  const bool has_ignore_setting = Utils::ExtractBooleanSetting( |
+      options, "ignorePunctuation", &ignore_punctuation); |
+  if (has_ignore_setting && ignore_punctuation) { |
+    collator->setAttribute(UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, status); |
+  } |
+ |
+  return collator; |
+} |
+ |
+// Reads the boolean setting |name| from |options| and, when |
+// Utils::ExtractBooleanSetting reports a value, switches |attribute| on or |
+// off on |collator| accordingly. |
+// |
+// Returns false only if ICU reports a failure while setting the attribute; |
+// returns true otherwise, including when no value was extracted. |
+static bool SetBooleanAttribute(UColAttribute attribute, |
+                                const char* name, |
+                                v8::Handle<v8::Object> options, |
+                                icu::Collator* collator) { |
+  bool enabled; |
+  if (!Utils::ExtractBooleanSetting(options, name, &enabled)) { |
+    // Nothing to apply, which is not an error. |
+    return true; |
+  } |
+ |
+  UErrorCode status = U_ZERO_ERROR; |
+  const UColAttributeValue value = enabled ? UCOL_ON : UCOL_OFF; |
+  collator->setAttribute(attribute, value, status); |
+  return !U_FAILURE(status); |
+} |
+ |
+// Writes the settings in effect on |collator| to |resolved|: "numeric", |
+// "caseFirst", "strength", "sensitivity", "ignorePunctuation" and "locale" |
+// (|icu_locale| converted to a language tag, or "und" if that fails). |
+// |collator| must not be NULL. |
+static void SetResolvedSettings(const icu::Locale& icu_locale, |
+                                icu::Collator* collator, |
+                                v8::Handle<v8::Object> resolved) { |
+  SetBooleanSetting(UCOL_NUMERIC_COLLATION, collator, "numeric", resolved); |
+ |
+  UErrorCode status = U_ZERO_ERROR; |
+ |
+  // Anything other than lower/upper first is reported as "false". |
+  const char* case_first = "false"; |
+  switch (collator->getAttribute(UCOL_CASE_FIRST, status)) { |
+    case UCOL_LOWER_FIRST: |
+      case_first = "lower"; |
+      break; |
+    case UCOL_UPPER_FIRST: |
+      case_first = "upper"; |
+      break; |
+    default: |
+      break; |
+  } |
+  resolved->Set(v8::String::New("caseFirst"), v8::String::New(case_first)); |
+ |
+  // We shouldn't get quaternary and identical from ICU, but if we do they |
+  // are reported with "variant" sensitivity. |
+  const char* strength = "identical"; |
+  const char* sensitivity = "variant"; |
+  switch (collator->getAttribute(UCOL_STRENGTH, status)) { |
+    case UCOL_PRIMARY: |
+      strength = "primary"; |
+      // case level: true + s1 -> case, s1 -> base. |
+      if (UCOL_ON == collator->getAttribute(UCOL_CASE_LEVEL, status)) { |
+        sensitivity = "case"; |
+      } else { |
+        sensitivity = "base"; |
+      } |
+      break; |
+    case UCOL_SECONDARY: |
+      strength = "secondary"; |
+      sensitivity = "accent"; |
+      break; |
+    case UCOL_TERTIARY: |
+      strength = "tertiary"; |
+      break; |
+    case UCOL_QUATERNARY: |
+      strength = "quaternary"; |
+      break; |
+    default: |
+      break; |
+  } |
+  resolved->Set(v8::String::New("strength"), v8::String::New(strength)); |
+  resolved->Set(v8::String::New("sensitivity"), |
+                v8::String::New(sensitivity)); |
+ |
+  const bool ignore_punctuation = |
+      UCOL_SHIFTED == collator->getAttribute(UCOL_ALTERNATE_HANDLING, status); |
+  resolved->Set(v8::String::New("ignorePunctuation"), |
+                v8::Boolean::New(ignore_punctuation)); |
+ |
+  // Set the locale |
+  char result[ULOC_FULLNAME_CAPACITY]; |
+  status = U_ZERO_ERROR; |
+  uloc_toLanguageTag( |
+      icu_locale.getName(), result, ULOC_FULLNAME_CAPACITY, FALSE, &status); |
+  // U_STRING_NOT_TERMINATED_WARNING counts as success for U_SUCCESS, but |
+  // |result| would then lack its terminating NUL, so treat it as a failure. |
+  if (U_SUCCESS(status) && status != U_STRING_NOT_TERMINATED_WARNING) { |
+    resolved->Set(v8::String::New("locale"), v8::String::New(result)); |
+  } else { |
+    // Not expected to happen, since we got the locale from ICU. |
+    resolved->Set(v8::String::New("locale"), v8::String::New("und")); |
+  } |
+} |
+ |
+// Stores under |property| on |resolved| whether |attribute| is switched on |
+// for |collator|: true when ICU reports UCOL_ON, false for anything else. |
+static void SetBooleanSetting(UColAttribute attribute, |
+                              icu::Collator* collator, |
+                              const char* property, |
+                              v8::Handle<v8::Object> resolved) { |
+  UErrorCode status = U_ZERO_ERROR; |
+  const bool is_on = UCOL_ON == collator->getAttribute(attribute, status); |
+  resolved->Set(v8::String::New(property), v8::Boolean::New(is_on)); |
+} |
+ |
+} // namespace v8_i18n |