| // Copyright (c) 2010 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "webkit/glue/plugins/pepper_char_set.h" |
| |
| #include <stdlib.h> |
| |
| #include "base/i18n/icu_string_conversions.h" |
| #include "ppapi/c/dev/ppb_char_set_dev.h" |
| #include "unicode/ucnv.h" |
| #include "unicode/ucnv_cb.h" |
| #include "unicode/ucnv_err.h" |
| #include "unicode/ustring.h" |
| #include "webkit/glue/plugins/pepper_plugin_delegate.h" |
| #include "webkit/glue/plugins/pepper_plugin_instance.h" |
| #include "webkit/glue/plugins/pepper_plugin_module.h" |
| #include "webkit/glue/plugins/pepper_var.h" |
| |
| namespace pepper { |
| |
| namespace { |
| |
| // Converts the given PP error handling behavior to the version in base, |
| // placing the result in |*result| and returning true on success. Returns false |
| // if the enum is invalid. |
| bool PPToBaseConversionError(PP_CharSet_ConversionError on_error, |
| base::OnStringConversionError::Type* result) { |
| switch (on_error) { |
| case PP_CHARSET_CONVERSIONERROR_FAIL: |
| *result = base::OnStringConversionError::FAIL; |
| return true; |
| case PP_CHARSET_CONVERSIONERROR_SKIP: |
| *result = base::OnStringConversionError::SKIP; |
| return true; |
| case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE: |
| *result = base::OnStringConversionError::SUBSTITUTE; |
| return true; |
| default: |
| return false; |
| } |
| } |
| |
| // The "substitution" behavior of this function does not match the |
| // implementation in base, so we partially duplicate the code from |
| // icu_string_conversions.cc with the correct error handling setup required |
| // by this pepper interface. |
| char* UTF16ToCharSet(const uint16_t* utf16, uint32_t utf16_len, |
| const char* output_char_set, |
| PP_CharSet_ConversionError on_error, |
| uint32_t* output_length) { |
| *output_length = 0; |
| |
| UErrorCode status = U_ZERO_ERROR; |
| UConverter* converter = ucnv_open(output_char_set, &status); |
| if (!U_SUCCESS(status)) |
| return NULL; |
| |
| int encoded_max_length = UCNV_GET_MAX_BYTES_FOR_STRING(utf16_len, |
| ucnv_getMaxCharSize(converter)); |
| |
| // Setup our error handler. |
| switch (on_error) { |
| case PP_CHARSET_CONVERSIONERROR_FAIL: |
| ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_STOP, 0, |
| NULL, NULL, &status); |
| break; |
| case PP_CHARSET_CONVERSIONERROR_SKIP: |
| ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SKIP, 0, |
| NULL, NULL, &status); |
| break; |
| case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE: { |
| // ICU sets the substitution char for some character sets (like latin1) |
| // to be the ASCII "substitution character" (26). We want to use '?' |
| // instead for backwards-compat with Windows behavior. |
| char subst_chars[32]; |
| int8_t subst_chars_len = 32; |
| ucnv_getSubstChars(converter, subst_chars, &subst_chars_len, &status); |
| if (subst_chars_len == 1 && subst_chars[0] == 26) { |
| // Override to the question mark character if possible. When using |
| // setSubstString, the input is a Unicode character. The function will |
| // try to convert it to the destination character set and fail if that |
| // can not be converted to the destination character set. |
| // |
| // We just ignore any failure. If the dest char set has no |
| // representation for '?', then we'll just stick to the ICU default |
| // substitution character. |
| UErrorCode subst_status = U_ZERO_ERROR; |
| UChar question_mark = '?'; |
| ucnv_setSubstString(converter, &question_mark, 1, &subst_status); |
| } |
| |
| ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SUBSTITUTE, 0, |
| NULL, NULL, &status); |
| break; |
| } |
| default: |
| return NULL; |
| } |
| |
| // ucnv_fromUChars returns size not including terminating null. |
| char* encoded = static_cast<char*>(malloc(encoded_max_length + 1)); |
| int actual_size = ucnv_fromUChars(converter, encoded, |
| encoded_max_length, reinterpret_cast<const UChar*>(utf16), utf16_len, |
| &status); |
| ucnv_close(converter); |
| if (!U_SUCCESS(status)) { |
| free(encoded); |
| return NULL; |
| } |
| encoded[actual_size] = 0; |
| *output_length = actual_size; |
| return encoded; |
| } |
| |
| uint16_t* CharSetToUTF16(const char* input, uint32_t input_len, |
| const char* input_char_set, |
| PP_CharSet_ConversionError on_error, |
| uint32_t* output_length) { |
| *output_length = 0; |
| |
| base::OnStringConversionError::Type base_on_error; |
| if (!PPToBaseConversionError(on_error, &base_on_error)) |
| return NULL; // Invalid enum value. |
| |
| // We can convert this call to the implementation in base to avoid code |
| // duplication, although this does introduce an extra copy of the data. |
| string16 output; |
| if (!base::CodepageToUTF16(std::string(input, input_len), input_char_set, |
| base_on_error, &output)) |
| return NULL; |
| |
| uint16_t* ret_buf = static_cast<uint16_t*>( |
| malloc((output.size() + 1) * sizeof(uint16_t))); |
| if (!ret_buf) |
| return NULL; |
| |
| *output_length = static_cast<uint32_t>(output.size()); |
| memcpy(ret_buf, output.c_str(), (output.size() + 1) * sizeof(uint16_t)); |
| return ret_buf; |
| } |
| |
| PP_Var GetDefaultCharSet(PP_Module pp_module) { |
| PluginModule* module = ResourceTracker::Get()->GetModule(pp_module); |
| if (!module) |
| return PP_MakeUndefined(); |
| |
| std::string encoding = |
| module->GetSomeInstance()->delegate()->GetDefaultEncoding(); |
| return StringVar::StringToPPVar(module, encoding); |
| } |
| |
| const PPB_CharSet_Dev ppb_charset = { |
| &UTF16ToCharSet, |
| &CharSetToUTF16, |
| &GetDefaultCharSet |
| }; |
| |
| } // namespace |
| |
| // static |
| const struct PPB_CharSet_Dev* CharSet::GetInterface() { |
| return &ppb_charset; |
| } |
| |
| } // namespace pepper |