webkit/glue/plugins/pepper_char_set.cc - platform/external/chromium - Git at Google

 // Copyright (c) 2010 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "webkit/glue/plugins/pepper_char_set.h"

 #include <stdlib.h>

 #include "base/i18n/icu_string_conversions.h"
 #include "ppapi/c/dev/ppb_char_set_dev.h"
 #include "unicode/ucnv.h"
 #include "unicode/ucnv_cb.h"
 #include "unicode/ucnv_err.h"
 #include "unicode/ustring.h"
 #include "webkit/glue/plugins/pepper_plugin_delegate.h"
 #include "webkit/glue/plugins/pepper_plugin_instance.h"
 #include "webkit/glue/plugins/pepper_plugin_module.h"
 #include "webkit/glue/plugins/pepper_var.h"

 namespace pepper {

 namespace {

 // Converts the given PP error handling behavior to the version in base,
 // placing the result in |*result| and returning true on success. Returns false
 // if the enum is invalid.
 bool PPToBaseConversionError(PP_CharSet_ConversionError on_error,
                              base::OnStringConversionError::Type* result) {
   switch (on_error) {
     case PP_CHARSET_CONVERSIONERROR_FAIL:
       *result = base::OnStringConversionError::FAIL;
       return true;
     case PP_CHARSET_CONVERSIONERROR_SKIP:
       *result = base::OnStringConversionError::SKIP;
       return true;
     case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE:
       *result = base::OnStringConversionError::SUBSTITUTE;
       return true;
     default:
       return false;
   }
 }

 // The "substitution" behavior of this function does not match the
 // implementation in base, so we partially duplicate the code from
 // icu_string_conversions.cc with the correct error handling setup required
 // by this pepper interface.
 char* UTF16ToCharSet(const uint16_t* utf16, uint32_t utf16_len,
                      const char* output_char_set,
                      PP_CharSet_ConversionError on_error,
                      uint32_t* output_length) {
   *output_length = 0;

   UErrorCode status = U_ZERO_ERROR;
   UConverter* converter = ucnv_open(output_char_set, &status);
   if (!U_SUCCESS(status))
     return NULL;

   int encoded_max_length = UCNV_GET_MAX_BYTES_FOR_STRING(utf16_len,
       ucnv_getMaxCharSize(converter));

   // Setup our error handler.
   switch (on_error) {
     case PP_CHARSET_CONVERSIONERROR_FAIL:
       ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_STOP, 0,
                             NULL, NULL, &status);
       break;
     case PP_CHARSET_CONVERSIONERROR_SKIP:
       ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SKIP, 0,
                             NULL, NULL, &status);
       break;
     case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE: {
       // ICU sets the substitution char for some character sets (like latin1)
       // to be the ASCII "substitution character" (26). We want to use '?'
       // instead for backwards-compat with Windows behavior.
       char subst_chars[32];
       int8_t subst_chars_len = 32;
       ucnv_getSubstChars(converter, subst_chars, &subst_chars_len, &status);
       if (subst_chars_len == 1 && subst_chars[0] == 26) {
         // Override to the question mark character if possible. When using
         // setSubstString, the input is a Unicode character. The function will
         // try to convert it to the destination character set and fail if that
         // can not be converted to the destination character set.
         //
         // We just ignore any failure. If the dest char set has no
         // representation for '?', then we'll just stick to the ICU default
         // substitution character.
         UErrorCode subst_status = U_ZERO_ERROR;
         UChar question_mark = '?';
         ucnv_setSubstString(converter, &question_mark, 1, &subst_status);
       }

       ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SUBSTITUTE, 0,
                             NULL, NULL, &status);
       break;
     }
     default:
       return NULL;
   }

   // ucnv_fromUChars returns size not including terminating null.
   char* encoded = static_cast<char*>(malloc(encoded_max_length + 1));
   int actual_size = ucnv_fromUChars(converter, encoded,
       encoded_max_length, reinterpret_cast<const UChar*>(utf16), utf16_len,
       &status);
   ucnv_close(converter);
   if (!U_SUCCESS(status)) {
     free(encoded);
     return NULL;
   }
   encoded[actual_size] = 0;
   *output_length = actual_size;
   return encoded;
 }

 uint16_t* CharSetToUTF16(const char* input, uint32_t input_len,
                          const char* input_char_set,
                          PP_CharSet_ConversionError on_error,
                          uint32_t* output_length) {
   *output_length = 0;

   base::OnStringConversionError::Type base_on_error;
   if (!PPToBaseConversionError(on_error, &base_on_error))
     return NULL;  // Invalid enum value.

   // We can convert this call to the implementation in base to avoid code
   // duplication, although this does introduce an extra copy of the data.
   string16 output;
   if (!base::CodepageToUTF16(std::string(input, input_len), input_char_set,
                              base_on_error, &output))
     return NULL;

   uint16_t* ret_buf = static_cast<uint16_t*>(
       malloc((output.size() + 1) * sizeof(uint16_t)));
   if (!ret_buf)
     return NULL;

   *output_length = static_cast<uint32_t>(output.size());
   memcpy(ret_buf, output.c_str(), (output.size() + 1) * sizeof(uint16_t));
   return ret_buf;
 }

 PP_Var GetDefaultCharSet(PP_Module pp_module) {
   PluginModule* module = ResourceTracker::Get()->GetModule(pp_module);
   if (!module)
     return PP_MakeUndefined();

   std::string encoding =
       module->GetSomeInstance()->delegate()->GetDefaultEncoding();
   return StringVar::StringToPPVar(module, encoding);
 }

 const PPB_CharSet_Dev ppb_charset = {
   &UTF16ToCharSet,
   &CharSetToUTF16,
   &GetDefaultCharSet
 };

 }  // namespace

 // static
 const struct PPB_CharSet_Dev* CharSet::GetInterface() {
   return &ppb_charset;
 }

 }  // namespace pepper
	// Copyright (c) 2010 The Chromium Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "webkit/glue/plugins/pepper_char_set.h"

	#include <stdlib.h>

	#include "base/i18n/icu_string_conversions.h"
	#include "ppapi/c/dev/ppb_char_set_dev.h"
	#include "unicode/ucnv.h"
	#include "unicode/ucnv_cb.h"
	#include "unicode/ucnv_err.h"
	#include "unicode/ustring.h"
	#include "webkit/glue/plugins/pepper_plugin_delegate.h"
	#include "webkit/glue/plugins/pepper_plugin_instance.h"
	#include "webkit/glue/plugins/pepper_plugin_module.h"
	#include "webkit/glue/plugins/pepper_var.h"

	namespace pepper {

	namespace {

	// Converts the given PP error handling behavior to the version in base,
	// placing the result in \|*result\| and returning true on success. Returns false
	// if the enum is invalid.
	bool PPToBaseConversionError(PP_CharSet_ConversionError on_error,
	base::OnStringConversionError::Type* result) {
	switch (on_error) {
	case PP_CHARSET_CONVERSIONERROR_FAIL:
	*result = base::OnStringConversionError::FAIL;
	return true;
	case PP_CHARSET_CONVERSIONERROR_SKIP:
	*result = base::OnStringConversionError::SKIP;
	return true;
	case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE:
	*result = base::OnStringConversionError::SUBSTITUTE;
	return true;
	default:
	return false;
	}
	}

	// The "substitution" behavior of this function does not match the
	// implementation in base, so we partially duplicate the code from
	// icu_string_conversions.cc with the correct error handling setup required
	// by this pepper interface.
	char* UTF16ToCharSet(const uint16_t* utf16, uint32_t utf16_len,
	const char* output_char_set,
	PP_CharSet_ConversionError on_error,
	uint32_t* output_length) {
	*output_length = 0;

	UErrorCode status = U_ZERO_ERROR;
	UConverter* converter = ucnv_open(output_char_set, &status);
	if (!U_SUCCESS(status))
	return NULL;

	int encoded_max_length = UCNV_GET_MAX_BYTES_FOR_STRING(utf16_len,
	ucnv_getMaxCharSize(converter));

	// Setup our error handler.
	switch (on_error) {
	case PP_CHARSET_CONVERSIONERROR_FAIL:
	ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_STOP, 0,
	NULL, NULL, &status);
	break;
	case PP_CHARSET_CONVERSIONERROR_SKIP:
	ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SKIP, 0,
	NULL, NULL, &status);
	break;
	case PP_CHARSET_CONVERSIONERROR_SUBSTITUTE: {
	// ICU sets the substitution char for some character sets (like latin1)
	// to be the ASCII "substitution character" (26). We want to use '?'
	// instead for backwards-compat with Windows behavior.
	char subst_chars[32];
	int8_t subst_chars_len = 32;
	ucnv_getSubstChars(converter, subst_chars, &subst_chars_len, &status);
	if (subst_chars_len == 1 && subst_chars[0] == 26) {
	// Override to the question mark character if possible. When using
	// setSubstString, the input is a Unicode character. The function will
	// try to convert it to the destination character set and fail if that
	// can not be converted to the destination character set.
	//
	// We just ignore any failure. If the dest char set has no
	// representation for '?', then we'll just stick to the ICU default
	// substitution character.
	UErrorCode subst_status = U_ZERO_ERROR;
	UChar question_mark = '?';
	ucnv_setSubstString(converter, &question_mark, 1, &subst_status);
	}

	ucnv_setFromUCallBack(converter, UCNV_FROM_U_CALLBACK_SUBSTITUTE, 0,
	NULL, NULL, &status);
	break;
	}
	default:
	return NULL;
	}

	// ucnv_fromUChars returns size not including terminating null.
	char* encoded = static_cast<char*>(malloc(encoded_max_length + 1));
	int actual_size = ucnv_fromUChars(converter, encoded,
	encoded_max_length, reinterpret_cast<const UChar*>(utf16), utf16_len,
	&status);
	ucnv_close(converter);
	if (!U_SUCCESS(status)) {
	free(encoded);
	return NULL;
	}
	encoded[actual_size] = 0;
	*output_length = actual_size;
	return encoded;
	}

	uint16_t* CharSetToUTF16(const char* input, uint32_t input_len,
	const char* input_char_set,
	PP_CharSet_ConversionError on_error,
	uint32_t* output_length) {
	*output_length = 0;

	base::OnStringConversionError::Type base_on_error;
	if (!PPToBaseConversionError(on_error, &base_on_error))
	return NULL; // Invalid enum value.

	// We can convert this call to the implementation in base to avoid code
	// duplication, although this does introduce an extra copy of the data.
	string16 output;
	if (!base::CodepageToUTF16(std::string(input, input_len), input_char_set,
	base_on_error, &output))
	return NULL;

	uint16_t* ret_buf = static_cast<uint16_t*>(
	malloc((output.size() + 1) * sizeof(uint16_t)));
	if (!ret_buf)
	return NULL;

	*output_length = static_cast<uint32_t>(output.size());
	memcpy(ret_buf, output.c_str(), (output.size() + 1) * sizeof(uint16_t));
	return ret_buf;
	}

	PP_Var GetDefaultCharSet(PP_Module pp_module) {
	PluginModule* module = ResourceTracker::Get()->GetModule(pp_module);
	if (!module)
	return PP_MakeUndefined();

	std::string encoding =
	module->GetSomeInstance()->delegate()->GetDefaultEncoding();
	return StringVar::StringToPPVar(module, encoding);
	}

	const PPB_CharSet_Dev ppb_charset = {
	&UTF16ToCharSet,
	&CharSetToUTF16,
	&GetDefaultCharSet
	};

	} // namespace

	// static
	const struct PPB_CharSet_Dev* CharSet::GetInterface() {
	return &ppb_charset;
	}

	} // namespace pepper