php-src/Zend/zend_multibyte.c
Christoph M. Becker c8955c078a
Revert GH-10220
Cf. <https://github.com/php/php-src/pull/10220#issuecomment-1383739816>.

This reverts commit ecc880f491.
This reverts commit 588a07f737.
This reverts commit f377e15751.
This reverts commit b4ba16fe18.
This reverts commit 694ec1deea.
This reverts commit 6b34de8eba.
This reverts commit aa1cd02a43.
This reverts commit 308fd311ea.
This reverts commit 16203b53e1.
This reverts commit 738fb5ca54.
This reverts commit 9fdbefacd3.
This reverts commit cd4a7c1d90.
This reverts commit 928685eba2.
This reverts commit 01e5ffc85c.
2023-01-16 12:27:33 +01:00

213 lines
7.2 KiB
C

/*
+----------------------------------------------------------------------+
| Zend Engine |
+----------------------------------------------------------------------+
| Copyright (c) Zend Technologies Ltd. (http://www.zend.com) |
+----------------------------------------------------------------------+
| This source file is subject to version 2.00 of the Zend license, |
| that is bundled with this package in the file LICENSE, and is |
| available through the world-wide-web at |
| http://www.zend.com/license/2_00.txt. |
| If you did not receive a copy of the Zend license and are unable to |
| obtain it through the world-wide-web, please send a note to |
| license@zend.com so we can mail you a copy immediately. |
+----------------------------------------------------------------------+
| Authors: Masaki Fujimoto <fujimoto@php.net> |
| Rui Hirokawa <hirokawa@php.net> |
+----------------------------------------------------------------------+
*/
#include "zend.h"
#include "zend_compile.h"
#include "zend_operators.h"
#include "zend_multibyte.h"
#include "zend_ini.h"
static const zend_encoding *dummy_encoding_fetcher(const char *encoding_name)
{
return NULL;
}
static const char *dummy_encoding_name_getter(const zend_encoding *encoding)
{
return (const char*)encoding;
}
static bool dummy_encoding_lexer_compatibility_checker(const zend_encoding *encoding)
{
return 0;
}
static const zend_encoding *dummy_encoding_detector(const unsigned char *string, size_t length, const zend_encoding **list, size_t list_size)
{
return NULL;
}
static size_t dummy_encoding_converter(unsigned char **to, size_t *to_length, const unsigned char *from, size_t from_length, const zend_encoding *encoding_to, const zend_encoding *encoding_from)
{
return (size_t)-1;
}
static zend_result dummy_encoding_list_parser(const char *encoding_list, size_t encoding_list_len, const zend_encoding ***return_list, size_t *return_size, bool persistent)
{
*return_list = pemalloc(0, persistent);
*return_size = 0;
return SUCCESS;
}
static const zend_encoding *dummy_internal_encoding_getter(void)
{
return NULL;
}
static zend_result dummy_internal_encoding_setter(const zend_encoding *encoding)
{
return FAILURE;
}
static zend_multibyte_functions multibyte_functions_dummy;
static zend_multibyte_functions multibyte_functions = {
NULL,
dummy_encoding_fetcher,
dummy_encoding_name_getter,
dummy_encoding_lexer_compatibility_checker,
dummy_encoding_detector,
dummy_encoding_converter,
dummy_encoding_list_parser,
dummy_internal_encoding_getter,
dummy_internal_encoding_setter
};
ZEND_API const zend_encoding *zend_multibyte_encoding_utf32be = (const zend_encoding*)"UTF-32BE";
ZEND_API const zend_encoding *zend_multibyte_encoding_utf32le = (const zend_encoding*)"UTF-32LE";
ZEND_API const zend_encoding *zend_multibyte_encoding_utf16be = (const zend_encoding*)"UTF-16BE";
ZEND_API const zend_encoding *zend_multibyte_encoding_utf16le = (const zend_encoding*)"UTF-32LE";
ZEND_API const zend_encoding *zend_multibyte_encoding_utf8 = (const zend_encoding*)"UTF-8";
ZEND_API zend_result zend_multibyte_set_functions(const zend_multibyte_functions *functions)
{
zend_multibyte_encoding_utf32be = functions->encoding_fetcher("UTF-32BE");
if (!zend_multibyte_encoding_utf32be) {
return FAILURE;
}
zend_multibyte_encoding_utf32le = functions->encoding_fetcher("UTF-32LE");
if (!zend_multibyte_encoding_utf32le) {
return FAILURE;
}
zend_multibyte_encoding_utf16be = functions->encoding_fetcher("UTF-16BE");
if (!zend_multibyte_encoding_utf16be) {
return FAILURE;
}
zend_multibyte_encoding_utf16le = functions->encoding_fetcher("UTF-16LE");
if (!zend_multibyte_encoding_utf16le) {
return FAILURE;
}
zend_multibyte_encoding_utf8 = functions->encoding_fetcher("UTF-8");
if (!zend_multibyte_encoding_utf8) {
return FAILURE;
}
multibyte_functions_dummy = multibyte_functions;
multibyte_functions = *functions;
/* As zend_multibyte_set_functions() gets called after ini settings were
* populated, we need to reinitialize script_encoding here.
*/
{
const char *value = zend_ini_string("zend.script_encoding", sizeof("zend.script_encoding") - 1, 0);
zend_multibyte_set_script_encoding_by_string(value, strlen(value));
}
return SUCCESS;
}
ZEND_API void zend_multibyte_restore_functions(void)
{
multibyte_functions = multibyte_functions_dummy;
}
ZEND_API const zend_multibyte_functions *zend_multibyte_get_functions(void)
{
return multibyte_functions.provider_name ? &multibyte_functions: NULL;
}
ZEND_API const zend_encoding *zend_multibyte_fetch_encoding(const char *name)
{
return multibyte_functions.encoding_fetcher(name);
}
ZEND_API const char *zend_multibyte_get_encoding_name(const zend_encoding *encoding)
{
return multibyte_functions.encoding_name_getter(encoding);
}
ZEND_API int zend_multibyte_check_lexer_compatibility(const zend_encoding *encoding)
{
return multibyte_functions.lexer_compatibility_checker(encoding);
}
ZEND_API const zend_encoding *zend_multibyte_encoding_detector(const unsigned char *string, size_t length, const zend_encoding **list, size_t list_size)
{
return multibyte_functions.encoding_detector(string, length, list, list_size);
}
ZEND_API size_t zend_multibyte_encoding_converter(unsigned char **to, size_t *to_length, const unsigned char *from, size_t from_length, const zend_encoding *encoding_to, const zend_encoding *encoding_from)
{
return multibyte_functions.encoding_converter(to, to_length, from, from_length, encoding_to, encoding_from);
}
ZEND_API zend_result zend_multibyte_parse_encoding_list(const char *encoding_list, size_t encoding_list_len, const zend_encoding ***return_list, size_t *return_size, bool persistent)
{
return multibyte_functions.encoding_list_parser(encoding_list, encoding_list_len, return_list, return_size, persistent);
}
ZEND_API const zend_encoding *zend_multibyte_get_internal_encoding(void)
{
return multibyte_functions.internal_encoding_getter();
}
ZEND_API const zend_encoding *zend_multibyte_get_script_encoding(void)
{
return LANG_SCNG(script_encoding);
}
ZEND_API int zend_multibyte_set_script_encoding(const zend_encoding **encoding_list, size_t encoding_list_size)
{
if (CG(script_encoding_list)) {
free((char*)CG(script_encoding_list));
}
CG(script_encoding_list) = encoding_list;
CG(script_encoding_list_size) = encoding_list_size;
return SUCCESS;
}
ZEND_API zend_result zend_multibyte_set_internal_encoding(const zend_encoding *encoding)
{
return multibyte_functions.internal_encoding_setter(encoding);
}
ZEND_API zend_result zend_multibyte_set_script_encoding_by_string(const char *new_value, size_t new_value_length)
{
const zend_encoding **list = 0;
size_t size = 0;
if (!new_value) {
zend_multibyte_set_script_encoding(NULL, 0);
return SUCCESS;
}
if (FAILURE == zend_multibyte_parse_encoding_list(new_value, new_value_length, &list, &size, 1)) {
return FAILURE;
}
if (size == 0) {
pefree((void*)list, 1);
return FAILURE;
}
if (FAILURE == zend_multibyte_set_script_encoding(list, size)) {
return FAILURE;
}
return SUCCESS;
}