php-src/ext/intl/intl_convert.c

155 lines
4.9 KiB
C
Raw Normal View History

2008-07-07 22:51:04 +00:00
/*
+----------------------------------------------------------------------+
2014-09-19 16:33:14 +00:00
| PHP Version 7 |
2008-07-07 22:51:04 +00:00
+----------------------------------------------------------------------+
| This source file is subject to version 3.01 of the PHP license, |
| that is bundled with this package in the file LICENSE, and is |
| available through the world-wide-web at the following url: |
| http://www.php.net/license/3_01.txt |
| If you did not receive a copy of the PHP license and are unable to |
| obtain it through the world-wide-web, please send a note to |
| license@php.net so we can mail you a copy immediately. |
+----------------------------------------------------------------------+
| Authors: Vadim Savchuk <vsavchuk@productengine.com> |
| Dmitry Lakhtyuk <dlakhtyuk@productengine.com> |
+----------------------------------------------------------------------+
*/
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#include <php.h>
#include "intl_common.h"
#include "intl_convert.h"
/* {{{ intl_convert_utf8_to_utf16
* Convert given string from UTF-8 to UTF-16 to *target buffer.
*
* It *target is NULL then we allocate a large enough buffer,
* store the converted string into it, and make target point to it.
*
* Otherwise, if *target is non-NULL, we assume that it points to a
* dynamically allocated buffer of *target_len bytes length.
* In this case the buffer will be used to store the converted string to,
* and may be resized (made larger) if needed.
*
2014-12-29 10:17:15 +00:00
* Note that ICU uses int32_t as string length and PHP uses size_t. While
* it is not likely in practical situations to have strings longer than
* INT32_MAX, these are different types and need to be handled carefully.
*
2008-07-07 22:51:04 +00:00
* @param target Where to place the result.
* @param target_len Result length.
* @param source String to convert.
* @param source_len Length of the source string.
* @param status Conversion status.
*
* @return void This function does not return anything.
*/
void intl_convert_utf8_to_utf16(
2014-12-29 10:17:15 +00:00
UChar** target, int32_t* target_len,
const char* src, size_t src_len,
2008-07-07 22:51:04 +00:00
UErrorCode* status )
{
UChar* dst_buf = NULL;
int32_t dst_len = 0;
2008-07-07 22:51:04 +00:00
/* If *target is NULL determine required destination buffer size (pre-flighting).
* Otherwise, attempt to convert source string; if *target buffer is not large enough
* it will be resized appropriately.
*/
2008-07-07 22:51:04 +00:00
*status = U_ZERO_ERROR;
2014-12-29 10:17:15 +00:00
if(src_len > INT32_MAX) {
/* we can not fit this string */
*status = U_BUFFER_OVERFLOW_ERROR;
return;
}
u_strFromUTF8( *target, *target_len, &dst_len, src, (int32_t)src_len, status );
2008-07-07 22:51:04 +00:00
if( *status == U_ZERO_ERROR )
{
/* String is converted successfully */
2008-07-07 22:51:04 +00:00
(*target)[dst_len] = 0;
*target_len = dst_len;
return;
}
/* Bail out if an unexpected error occurred.
* (U_BUFFER_OVERFLOW_ERROR means that *target buffer is not large enough).
* (U_STRING_NOT_TERMINATED_WARNING usually means that the input string is empty).
*/
2008-07-07 22:51:04 +00:00
if( *status != U_BUFFER_OVERFLOW_ERROR && *status != U_STRING_NOT_TERMINATED_WARNING )
return;
/* Allocate memory for the destination buffer (it will be zero-terminated). */
2008-07-07 22:51:04 +00:00
dst_buf = eumalloc( dst_len + 1 );
/* Convert source string from UTF-8 to UTF-16. */
2008-07-07 22:51:04 +00:00
*status = U_ZERO_ERROR;
u_strFromUTF8( dst_buf, dst_len+1, NULL, src, src_len, status );
if( U_FAILURE( *status ) )
{
efree( dst_buf );
return;
}
dst_buf[dst_len] = 0;
if( *target )
efree( *target );
*target = dst_buf;
*target_len = dst_len;
}
/* }}} */
/* {{{ intl_convert_utf16_to_utf8
* Convert given string from UTF-16 to UTF-8.
*
* @param source String to convert.
* @param source_len Length of the source string.
* @param status Conversion status.
*
2015-07-01 10:26:39 +00:00
* @return zend_string
2008-07-07 22:51:04 +00:00
*/
2015-07-01 10:26:39 +00:00
zend_string* intl_convert_utf16_to_utf8(
2014-12-29 10:17:15 +00:00
const UChar* src, int32_t src_len,
2008-07-07 22:51:04 +00:00
UErrorCode* status )
{
2015-07-01 10:26:39 +00:00
zend_string* dst;
int32_t dst_len;
2008-07-07 22:51:04 +00:00
/* Determine required destination buffer size (pre-flighting). */
2008-07-07 22:51:04 +00:00
*status = U_ZERO_ERROR;
u_strToUTF8( NULL, 0, &dst_len, src, src_len, status );
/* Bail out if an unexpected error occurred.
* (U_BUFFER_OVERFLOW_ERROR means that *target buffer is not large enough).
* (U_STRING_NOT_TERMINATED_WARNING usually means that the input string is empty).
*/
2008-07-07 22:51:04 +00:00
if( *status != U_BUFFER_OVERFLOW_ERROR && *status != U_STRING_NOT_TERMINATED_WARNING )
2015-07-01 10:26:39 +00:00
return NULL;
2008-07-07 22:51:04 +00:00
/* Allocate memory for the destination buffer (it will be zero-terminated). */
2015-07-01 10:26:39 +00:00
dst = zend_string_alloc(dst_len, 0);
2008-07-07 22:51:04 +00:00
/* Convert source string from UTF-8 to UTF-16. */
2008-07-07 22:51:04 +00:00
*status = U_ZERO_ERROR;
2015-07-01 10:26:39 +00:00
u_strToUTF8( ZSTR_VAL(dst), dst_len, NULL, src, src_len, status );
2008-07-07 22:51:04 +00:00
if( U_FAILURE( *status ) )
{
zend_string_efree(dst);
2015-07-01 10:26:39 +00:00
return NULL;
2008-07-07 22:51:04 +00:00
}
/* U_STRING_NOT_TERMINATED_WARNING is OK for us => reset 'status'. */
2008-07-07 22:51:04 +00:00
*status = U_ZERO_ERROR;
2015-07-01 10:26:39 +00:00
ZSTR_VAL(dst)[dst_len] = 0;
return dst;
2008-07-07 22:51:04 +00:00
}
/* }}} */