Index: ppapi/shared_impl/char_set_impl.cc |
diff --git a/ppapi/shared_impl/char_set_impl.cc b/ppapi/shared_impl/char_set_impl.cc |
new file mode 100644 |
index 0000000000000000000000000000000000000000..012f9d652adfebf3e9bb6a263d959413167db92d |
--- /dev/null |
+++ b/ppapi/shared_impl/char_set_impl.cc |
@@ -0,0 +1,153 @@ |
+// Copyright (c) 2011 The Chromium Authors. All rights reserved. |
+// Use of this source code is governed by a BSD-style license that can be |
+// found in the LICENSE file. |
+ |
+#include "ppapi/shared_impl/char_set_impl.h" |
+ |
+#include "base/i18n/icu_string_conversions.h" |
+#include "ppapi/c/ppb_core.h" |
+#include "unicode/ucnv.h" |
+#include "unicode/ucnv_cb.h" |
+#include "unicode/ucnv_err.h" |
+#include "unicode/ustring.h" |
+ |
+namespace pp { |
+namespace shared_impl { |
+ |
+namespace { |
+ |
+// Converts the given PP error handling behavior to the version in base, |
+// placing the result in |*result| and returning true on success. Returns false |
+// if the enum is invalid. |
+bool PPToBaseConversionError(PP_CharSet_ConversionError on_error, |
+ base::OnStringConversionError::Type* result) { |
+ switch (on_error) { |
+ case PP_CHARSET_CONVERSIONERROR_FAIL: |
+ *result = base::OnStringConversionError::FAIL; |
+ return true; |
+ case PP_CHARSET_CONVERSIONERROR_SKIP: |
+ *result = base::OnStringConversionError::SKIP; |
+ return true; |
+ case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE: |
+ *result = base::OnStringConversionError::SUBSTITUTE; |
+ return true; |
+ default: |
+ return false; |
+ } |
+} |
+ |
+} // namespace |
+ |
+// static |
+// The "substitution" behavior of this function does not match the |
+// implementation in base, so we partially duplicate the code from |
+// icu_string_conversions.cc with the correct error handling setup required |
+// by the PPAPI interface. |
+char* CharSetImpl::UTF16ToCharSet(const PPB_Core* core, |
+ const uint16_t* utf16, |
+ uint32_t utf16_len, |
+ const char* output_char_set, |
+ PP_CharSet_ConversionError on_error, |
+ uint32_t* output_length) { |
+ if (!core || !utf16 || !output_char_set || !output_length) |
+ return NULL; |
+ |
+ *output_length = 0; |
+ |
+ UErrorCode status = U_ZERO_ERROR; |
+ UConverter* converter = ucnv_open(output_char_set, &status); |
+ if (!U_SUCCESS(status)) |
+ return NULL; |
+ |
+ int encoded_max_length = UCNV_GET_MAX_BYTES_FOR_STRING(utf16_len, |
+ ucnv_getMaxCharSize(converter)); |
+ |
+ // Setup our error handler. |
+ switch (on_error) { |
+ case PP_CHARSET_CONVERSIONERROR_FAIL: |
+ ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_STOP, 0, |
+ NULL, NULL, &status); |
+ break; |
+ case PP_CHARSET_CONVERSIONERROR_SKIP: |
+ ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SKIP, 0, |
+ NULL, NULL, &status); |
+ break; |
+ case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE: { |
+ // ICU sets the substitution char for some character sets (like latin1) |
+ // to be the ASCII "substitution character" (26). We want to use '?' |
+ // instead for backwards-compat with Windows behavior. |
+ char subst_chars[32]; |
+ int8_t subst_chars_len = 32; |
+ ucnv_getSubstChars(converter, subst_chars, &subst_chars_len, &status); |
+ if (subst_chars_len == 1 && subst_chars[0] == 26) { |
+ // Override to the question mark character if possible. When using |
+ // setSubstString, the input is a Unicode character. The function will |
+ // try to convert it to the destination character set and fail if that |
+ // can not be converted to the destination character set. |
+ // |
+ // We just ignore any failure. If the dest char set has no |
+ // representation for '?', then we'll just stick to the ICU default |
+ // substitution character. |
+ UErrorCode subst_status = U_ZERO_ERROR; |
+ UChar question_mark = '?'; |
+ ucnv_setSubstString(converter, &question_mark, 1, &subst_status); |
+ } |
+ |
+ ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SUBSTITUTE, 0, |
+ NULL, NULL, &status); |
+ break; |
+ } |
+ default: |
+ return NULL; |
+ } |
+ |
+ // ucnv_fromUChars returns size not including terminating null. |
+ char* encoded = static_cast<char*>(core->MemAlloc(encoded_max_length + 1)); |
+ int actual_size = ucnv_fromUChars(converter, encoded, |
+ encoded_max_length, reinterpret_cast<const UChar*>(utf16), utf16_len, |
+ &status); |
+ ucnv_close(converter); |
+ if (!U_SUCCESS(status)) { |
+ core->MemFree(encoded); |
+ return NULL; |
+ } |
+ encoded[actual_size] = 0; |
+ *output_length = actual_size; |
+ return encoded; |
+} |
+ |
+// static |
+uint16_t* CharSetImpl::CharSetToUTF16(const PPB_Core* core, |
+ const char* input, |
+ uint32_t input_len, |
+ const char* input_char_set, |
+ PP_CharSet_ConversionError on_error, |
+ uint32_t* output_length) { |
+ if (!core || !input || !input_char_set || !output_length) |
+ return NULL; |
+ |
+ *output_length = 0; |
+ |
+ base::OnStringConversionError::Type base_on_error; |
+ if (!PPToBaseConversionError(on_error, &base_on_error)) |
+ return NULL; // Invalid enum value. |
+ |
+ // We can convert this call to the implementation in base to avoid code |
+ // duplication, although this does introduce an extra copy of the data. |
+ string16 output; |
+ if (!base::CodepageToUTF16(std::string(input, input_len), input_char_set, |
+ base_on_error, &output)) |
+ return NULL; |
+ |
+ uint16_t* ret_buf = static_cast<uint16_t*>( |
+ core->MemAlloc((output.size() + 1) * sizeof(uint16_t))); |
+ if (!ret_buf) |
+ return NULL; |
+ |
+ *output_length = static_cast<uint32_t>(output.size()); |
+ memcpy(ret_buf, output.c_str(), (output.size() + 1) * sizeof(uint16_t)); |
+ return ret_buf; |
+} |
+ |
+} // namespace shared_impl |
+} // namespace pp |