mirror of
https://github.com/php/php-src.git
synced 2024-12-04 07:14:10 +08:00
1485 lines
39 KiB
C
1485 lines
39 KiB
C
/*
|
|
+----------------------------------------------------------------------+
|
|
| PHP version 4.0 |
|
|
+----------------------------------------------------------------------+
|
|
| Copyright (c) 1997, 1998, 1999 The PHP Group |
|
|
+----------------------------------------------------------------------+
|
|
| This source file is subject to version 2.0 of the PHP license, |
|
|
| that is bundled with this package in the file LICENSE, and is |
|
|
| available through the world-wide-web at |
|
|
| http://www.php.net/license/2_0.txt. |
|
|
| If you did not receive a copy of the PHP license and are unable to |
|
|
| obtain it through the world-wide-web, please send a note to |
|
|
| license@php.net so we can mail you a copy immediately. |
|
|
+----------------------------------------------------------------------+
|
|
| Authors: Stig Sæther Bakken <ssb@fast.no> |
|
|
+----------------------------------------------------------------------+
|
|
*/
|
|
|
|
/* $Id$ */
|
|
#define IS_EXT_MODULE
|
|
|
|
/* boldly assume that if PIC is defined, we are being compiled dynamically */
|
|
#ifdef PIC
|
|
# define COMPILE_DL 1
|
|
#endif
|
|
|
|
#if COMPILE_DL
|
|
# include "dl/phpdl.h"
|
|
#endif
|
|
#include "php.h"
|
|
#include "php3_xml.h"
|
|
#include "zend_variables.h"
|
|
#include "ext/standard/php3_string.h"
|
|
|
|
|
|
#if HAVE_LIBEXPAT
|
|
|
|
# if !(WIN32|WINNT)
|
|
# include "build-defs.h"
|
|
# endif
|
|
# include "snprintf.h"
|
|
# include "ext/standard/head.h"
|
|
|
|
/* Short-term TODO list:
|
|
* - Implement XML_ExternalEntityParserCreate()
|
|
*/
|
|
|
|
/* Long-term TODO list:
|
|
* - Fix the expat library so you can install your own memory manager
|
|
* functions
|
|
*/
|
|
|
|
/* Known bugs:
|
|
* - Weird things happen with <![CDATA[]]> sections.
|
|
*/
|
|
|
|
|
|
/* Storage for the extension's globals. In a ZTS build only an id is kept
 * here (it is assigned from ts_allocate_id() in PHP_MINIT_FUNCTION(xml));
 * otherwise the globals structure itself is defined here. */
#ifdef ZTS
|
|
int xml_globals_id;
|
|
#else
|
|
PHP_XML_API php_xml_globals xml_globals;
|
|
#endif
|
|
|
|
/* {{{ dynamically loadable module stuff */
|
|
|
|
# if COMPILE_DL
/* Entry point for dynamically loaded builds: returns the address of this
 * extension's module entry. */
DLEXPORT zend_module_entry *get_module(void)
{
	return &xml_module_entry;
}
# endif /* COMPILE_DL */
|
|
|
|
/* }}} */
|
|
/* {{{ function prototypes */
|
|
|
|
/* {{{ php3i_long_pval() */
|
|
|
|
/* Allocate a new pval holding the integer `value`.
 * The result is allocated with MAKE_STD_ZVAL. */
PHPAPI pval *php3i_long_pval(long value)
{
	pval *result;

	MAKE_STD_ZVAL(result);
	result->value.lval = value;
	result->type = IS_LONG;

	return result;
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_double_pval() */
|
|
|
|
/* Allocate a new pval holding the floating point number `value`.
 * The result is allocated with MAKE_STD_ZVAL. */
PHPAPI pval *php3i_double_pval(double value)
{
	pval *result;

	MAKE_STD_ZVAL(result);
	result->value.dval = value;
	result->type = IS_DOUBLE;

	return result;
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_string_pval() */
|
|
|
|
/* Allocate a new string pval holding a private copy of the NUL-terminated
 * string `str` (the copy is made with estrndup). `str` must not be NULL,
 * because its length is taken with strlen(). */
PHPAPI pval *php3i_string_pval(const char *str)
{
	pval *result;
	int length;

	length = strlen(str);
	MAKE_STD_ZVAL(result);

	result->type = IS_STRING;
	result->value.str.val = estrndup(str, length);
	result->value.str.len = length;

	return result;
}
|
|
|
|
/* }}} */
|
|
|
|
PHP_MINIT_FUNCTION(xml);
|
|
PHP_RINIT_FUNCTION(xml);
|
|
PHP_MSHUTDOWN_FUNCTION(xml);
|
|
PHP_RSHUTDOWN_FUNCTION(xml);
|
|
PHP_MINFO_FUNCTION(xml);
|
|
|
|
static void xml_destroy_parser(xml_parser *);
|
|
static void xml_set_handler(char **, pval *);
|
|
inline static unsigned short xml_encode_iso_8859_1(unsigned char);
|
|
inline static char xml_decode_iso_8859_1(unsigned short);
|
|
inline static unsigned short xml_encode_us_ascii(unsigned char);
|
|
inline static char xml_decode_us_ascii(unsigned short);
|
|
static XML_Char *xml_utf8_encode(const char *, int, int *, const XML_Char *);
|
|
static char *xml_utf8_decode(const XML_Char *, int, int *, const XML_Char *);
|
|
static pval *xml_call_handler(xml_parser *, char *, int, pval **);
|
|
static pval *php3i_xmlcharpval(const XML_Char *, int, const XML_Char *);
|
|
static int php3i_xmlcharlen(const XML_Char *);
|
|
static void php3i_add_to_info(xml_parser *parser,char *name);
|
|
|
|
|
|
void php3i_xml_startElementHandler(void *, const char *, const char **);
|
|
void php3i_xml_endElementHandler(void *, const char *);
|
|
void php3i_xml_characterDataHandler(void *, const XML_Char *, int);
|
|
void php3i_xml_processingInstructionHandler(void *, const XML_Char *, const XML_Char *);
|
|
void php3i_xml_defaultHandler(void *, const XML_Char *, int);
|
|
void php3i_xml_unparsedEntityDeclHandler(void *, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *);
|
|
void php3i_xml_notationDeclHandler(void *, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *);
|
|
int php3i_xml_externalEntityRefHandler(XML_Parser, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *);
|
|
|
|
/* }}} */
|
|
/* {{{ extension definition structures */
|
|
|
|
function_entry xml_functions[] = {
|
|
PHP_FE(xml_parser_create, NULL)
|
|
PHP_FE(xml_set_element_handler, NULL)
|
|
PHP_FE(xml_set_character_data_handler, NULL)
|
|
PHP_FE(xml_set_processing_instruction_handler, NULL)
|
|
PHP_FE(xml_set_default_handler, NULL)
|
|
PHP_FE(xml_set_unparsed_entity_decl_handler, NULL)
|
|
PHP_FE(xml_set_notation_decl_handler, NULL)
|
|
PHP_FE(xml_set_external_entity_ref_handler, NULL)
|
|
PHP_FE(xml_parse, NULL)
|
|
PHP_FE(xml_parse_into_struct, NULL)
|
|
PHP_FE(xml_get_error_code, NULL)
|
|
PHP_FE(xml_error_string, NULL)
|
|
PHP_FE(xml_get_current_line_number, NULL)
|
|
PHP_FE(xml_get_current_column_number, NULL)
|
|
PHP_FE(xml_get_current_byte_index, NULL)
|
|
PHP_FE(xml_parser_free, NULL)
|
|
PHP_FE(xml_parser_set_option, NULL)
|
|
PHP_FE(xml_parser_get_option, NULL)
|
|
PHP_FE(utf8_encode, NULL)
|
|
PHP_FE(utf8_decode, NULL)
|
|
{NULL, NULL, NULL}
|
|
};
|
|
|
|
php3_module_entry xml_module_entry = {
|
|
"XML", /* extension name */
|
|
xml_functions, /* extension function list */
|
|
PHP_MINIT(xml), /* extension-wide startup function */
|
|
PHP_MSHUTDOWN(xml), /* extension-wide shutdown function */
|
|
PHP_RINIT(xml), /* per-request startup function */
|
|
PHP_RSHUTDOWN(xml), /* per-request shutdown function */
|
|
PHP_MINFO(xml), /* information function */
|
|
STANDARD_MODULE_PROPERTIES
|
|
};
|
|
|
|
/* All the encoding functions are set to NULL right now, since all
|
|
* the encoding is currently done internally by expat/xmltok.
|
|
*/
|
|
xml_encoding xml_encodings[] = {
|
|
{ "ISO-8859-1", xml_decode_iso_8859_1, xml_encode_iso_8859_1 },
|
|
{ "US-ASCII", xml_decode_us_ascii, xml_encode_us_ascii },
|
|
{ "UTF-8", NULL, NULL },
|
|
{ NULL, NULL, NULL }
|
|
};
|
|
|
|
/* True globals, no need for thread safety.
 * le_xml_parser is the resource list type for XML parsers; it is assigned
 * from register_list_destructors() in PHP_MINIT_FUNCTION(xml). */
|
|
static int le_xml_parser;
|
|
|
|
/* }}} */
|
|
/* {{{ startup, shutdown and info functions */
|
|
|
|
/* {{{ php3_minit_xml */
|
|
|
|
#ifdef ZTS
/* Initialiser handed to ts_allocate_id() in PHP_MINIT_FUNCTION(xml): sets
 * the default encoding to ISO-8859-1. The XML() accessor presumably
 * resolves through the `xml_globals` parameter in ZTS builds -- confirm
 * against its definition. */
static void php_xml_init_globals(php_xml_globals *xml_globals)
{
	XML(default_encoding) = "ISO-8859-1";
}
#endif
|
|
|
|
PHP_MINIT_FUNCTION(xml)
|
|
{
|
|
|
|
ELS_FETCH();
|
|
|
|
le_xml_parser = register_list_destructors(xml_destroy_parser, NULL);
|
|
|
|
#ifdef ZTS
|
|
xml_globals_id = ts_allocate_id(sizeof(php_xml_globals), php_xml_init_globals, NULL);
|
|
#else
|
|
XML(default_encoding) = "ISO-8859-1";
|
|
#endif
|
|
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_NONE", XML_ERROR_NONE, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_NO_MEMORY", XML_ERROR_NO_MEMORY, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_SYNTAX", XML_ERROR_SYNTAX, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_NO_ELEMENTS", XML_ERROR_NO_ELEMENTS, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_INVALID_TOKEN", XML_ERROR_INVALID_TOKEN, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_UNCLOSED_TOKEN", XML_ERROR_UNCLOSED_TOKEN, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_PARTIAL_CHAR", XML_ERROR_PARTIAL_CHAR, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_TAG_MISMATCH", XML_ERROR_TAG_MISMATCH, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_DUPLICATE_ATTRIBUTE", XML_ERROR_DUPLICATE_ATTRIBUTE, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_JUNK_AFTER_DOC_ELEMENT", XML_ERROR_JUNK_AFTER_DOC_ELEMENT, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_PARAM_ENTITY_REF", XML_ERROR_PARAM_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_UNDEFINED_ENTITY", XML_ERROR_UNDEFINED_ENTITY, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_RECURSIVE_ENTITY_REF", XML_ERROR_RECURSIVE_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_ASYNC_ENTITY", XML_ERROR_ASYNC_ENTITY, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_BAD_CHAR_REF", XML_ERROR_BAD_CHAR_REF, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_BINARY_ENTITY_REF", XML_ERROR_BINARY_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF", XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_MISPLACED_XML_PI", XML_ERROR_MISPLACED_XML_PI, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_UNKNOWN_ENCODING", XML_ERROR_UNKNOWN_ENCODING, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_INCORRECT_ENCODING", XML_ERROR_INCORRECT_ENCODING, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_UNCLOSED_CDATA_SECTION", XML_ERROR_UNCLOSED_CDATA_SECTION, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_ERROR_EXTERNAL_ENTITY_HANDLING", XML_ERROR_EXTERNAL_ENTITY_HANDLING, CONST_CS|CONST_PERSISTENT);
|
|
|
|
REGISTER_LONG_CONSTANT("XML_OPTION_CASE_FOLDING", PHP3_XML_OPTION_CASE_FOLDING, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_OPTION_TARGET_ENCODING", PHP3_XML_OPTION_TARGET_ENCODING, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_OPTION_SKIP_TAGSTART", PHP3_XML_OPTION_SKIP_TAGSTART, CONST_CS|CONST_PERSISTENT);
|
|
REGISTER_LONG_CONSTANT("XML_OPTION_SKIP_WHITE", PHP3_XML_OPTION_SKIP_WHITE, CONST_CS|CONST_PERSISTENT);
|
|
|
|
|
|
return SUCCESS;
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3_rinit_xml */
|
|
|
|
PHP_RINIT_FUNCTION(xml)
|
|
{
|
|
return SUCCESS;
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3_mshutdown_xml() */
|
|
|
|
PHP_MSHUTDOWN_FUNCTION(xml)
|
|
{
|
|
return SUCCESS;
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3_rshutdown_xml() */
|
|
|
|
PHP_RSHUTDOWN_FUNCTION(xml)
|
|
{
|
|
return SUCCESS;
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3_info_xml() */
|
|
|
|
/* Information hook: emits a one-line status message for this extension. */
PHP_MINFO_FUNCTION(xml)
{
	PUTS("XML support active");
}
|
|
|
|
/* }}} */
|
|
|
|
/* }}} */
|
|
/* {{{ extension-internal functions */
|
|
|
|
/* {{{ xml_destroy_parser() */
|
|
|
|
static void
|
|
xml_destroy_parser(xml_parser *parser)
|
|
{
|
|
if (parser->parser) {
|
|
XML_ParserFree(parser->parser);
|
|
}
|
|
if (parser->ltags) {
|
|
efree(parser->ltags);
|
|
}
|
|
if (parser->startElementHandler) {
|
|
efree(parser->startElementHandler);
|
|
}
|
|
if (parser->endElementHandler) {
|
|
efree(parser->endElementHandler);
|
|
}
|
|
if (parser->characterDataHandler) {
|
|
efree(parser->characterDataHandler);
|
|
}
|
|
if (parser->processingInstructionHandler) {
|
|
efree(parser->processingInstructionHandler);
|
|
}
|
|
if (parser->defaultHandler) {
|
|
efree(parser->defaultHandler);
|
|
}
|
|
if (parser->unparsedEntityDeclHandler) {
|
|
efree(parser->unparsedEntityDeclHandler);
|
|
}
|
|
if (parser->notationDeclHandler) {
|
|
efree(parser->notationDeclHandler);
|
|
}
|
|
if (parser->externalEntityRefHandler) {
|
|
efree(parser->externalEntityRefHandler);
|
|
}
|
|
if (parser->unknownEncodingHandler) {
|
|
efree(parser->unknownEncodingHandler);
|
|
}
|
|
if (parser->baseURI) {
|
|
efree(parser->baseURI);
|
|
}
|
|
|
|
efree(parser);
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_set_handler() */
|
|
|
|
static void
|
|
xml_set_handler(char **nameBufp, pval *data)
|
|
{
|
|
if (data->value.str.len > 0) {
|
|
if (*nameBufp != NULL) {
|
|
efree(*nameBufp);
|
|
}
|
|
convert_to_string(data);
|
|
*nameBufp = estrndup(data->value.str.val, data->value.str.len);
|
|
} else {
|
|
if (*nameBufp != NULL) {
|
|
efree(*nameBufp);
|
|
}
|
|
*nameBufp = NULL;
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_call_handler() */
|
|
|
|
static pval *
|
|
xml_call_handler(xml_parser *parser, char *funcName, int argc, pval **argv)
|
|
{
|
|
ELS_FETCH();
|
|
|
|
if (parser && funcName) {
|
|
pval *retval, *func;
|
|
int i;
|
|
|
|
func = php3i_string_pval(funcName);
|
|
retval = emalloc(sizeof(pval));
|
|
/* We cannot call internal variables from a function module as
|
|
it breaks any chance of compiling it as a module on windows.
|
|
Instead, we create a callback function. */
|
|
if (call_user_function(EG(function_table), NULL, func, retval, argc, argv) == FAILURE) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
return NULL;
|
|
}
|
|
zval_dtor(func);
|
|
efree(func);
|
|
for (i = 0; i < argc; i++) {
|
|
zval_dtor(argv[i]);
|
|
efree(argv[i]);
|
|
}
|
|
return retval;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_encode_iso_8859_1() */
|
|
|
|
/* Map one ISO-8859-1 byte to its 16-bit character code; the value is
 * passed through unchanged. */
static inline unsigned short
xml_encode_iso_8859_1(unsigned char c)
{
	unsigned short code = c;

	return code;
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_decode_iso_8859_1() */
|
|
|
|
/* Map a 16-bit character code to one ISO-8859-1 byte; codes above 0xff
 * are replaced with '?'. */
static inline char
xml_decode_iso_8859_1(unsigned short c)
{
	if (c > 0xff) {
		return '?';
	}
	return (char) c;
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_encode_us_ascii() */
|
|
|
|
/* Map one US-ASCII byte to its 16-bit character code; the value is passed
 * through unchanged, including bytes above 0x7f. */
static inline unsigned short
xml_encode_us_ascii(unsigned char c)
{
	unsigned short code = c;

	return code;
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_decode_us_ascii() */
|
|
|
|
/* Map a 16-bit character code to one US-ASCII byte; codes above 0x7f are
 * replaced with '?'. */
static inline char
xml_decode_us_ascii(unsigned short c)
{
	if (c > 0x7f) {
		return '?';
	}
	return (char) c;
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_get_encoding() */
|
|
|
|
static xml_encoding *
|
|
xml_get_encoding(const XML_Char *name)
|
|
{
|
|
xml_encoding *enc = &xml_encodings[0];
|
|
|
|
while (enc && enc->name) {
|
|
if (strcasecmp(name, enc->name) == 0) {
|
|
return enc;
|
|
}
|
|
enc++;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ xml_utf8_encode */
|
|
static XML_Char *
|
|
xml_utf8_encode(const char *s, int len, int *newlen, const XML_Char *encoding)
|
|
{
|
|
int pos = len;
|
|
char *newbuf;
|
|
unsigned short c;
|
|
unsigned short (*encoder)(unsigned char) = NULL;
|
|
xml_encoding *enc = xml_get_encoding(encoding);
|
|
|
|
*newlen = 0;
|
|
if (enc) {
|
|
encoder = enc->encoding_function;
|
|
} else {
|
|
/* If the target encoding was unknown, fail */
|
|
return NULL;
|
|
}
|
|
if (encoder == NULL) {
|
|
/* If no encoder function was specified, return the data as-is.
|
|
*/
|
|
newbuf = emalloc(len);
|
|
memcpy(newbuf, s, len);
|
|
*newlen = len;
|
|
return newbuf;
|
|
}
|
|
/* This is the theoretical max (will never get beyond len * 2 as long
|
|
* as we are converting from single-byte characters, though) */
|
|
newbuf = emalloc(len * 4);
|
|
while (pos > 0) {
|
|
c = encoder ? encoder((unsigned char)(*s)) : (unsigned short)(*s);
|
|
if (c < 0x80) {
|
|
newbuf[(*newlen)++] = c;
|
|
} else if (c < 0x800) {
|
|
newbuf[(*newlen)++] = (0xc0 | (c >> 6));
|
|
newbuf[(*newlen)++] = (0x80 | (c & 0x3f));
|
|
} else if (c < 0x10000) {
|
|
newbuf[(*newlen)++] = (0xe0 | (c >> 12));
|
|
newbuf[(*newlen)++] = (0xc0 | ((c >> 6) & 0x3f));
|
|
newbuf[(*newlen)++] = (0x80 | (c & 0x3f));
|
|
} else if (c < 0x200000) {
|
|
newbuf[(*newlen)++] = (0xf0 | (c >> 18));
|
|
newbuf[(*newlen)++] = (0xe0 | ((c >> 12) & 0x3f));
|
|
newbuf[(*newlen)++] = (0xc0 | ((c >> 6) & 0x3f));
|
|
newbuf[(*newlen)++] = (0x80 | (c & 0x3f));
|
|
}
|
|
pos--;
|
|
s++;
|
|
}
|
|
if (*newlen < len * 4) {
|
|
newbuf = erealloc(newbuf, *newlen);
|
|
}
|
|
return newbuf;
|
|
}
|
|
/* }}} */
|
|
/* {{{ xml_utf8_decode */
|
|
static char *
|
|
xml_utf8_decode(const XML_Char *s, int len, int *newlen, const XML_Char *encoding)
|
|
{
|
|
int pos = len;
|
|
char *newbuf = emalloc(len + 1);
|
|
unsigned short c;
|
|
char (*decoder)(unsigned short) = NULL;
|
|
xml_encoding *enc = xml_get_encoding(encoding);
|
|
|
|
*newlen = 0;
|
|
if (enc) {
|
|
decoder = enc->decoding_function;
|
|
}
|
|
if (decoder == NULL) {
|
|
/* If the target encoding was unknown, or no decoder function
|
|
* was specified, return the UTF-8-encoded data as-is.
|
|
*/
|
|
memcpy(newbuf, s, len);
|
|
*newlen = len;
|
|
newbuf[*newlen] = '\0';
|
|
return newbuf;
|
|
}
|
|
while (pos > 0) {
|
|
c = (unsigned char)(*s);
|
|
if (c >= 0xf0) { /* four bytes encoded, 21 bits */
|
|
c = ((s[0]&7)<<18) | ((s[1]&63)<<12) | ((s[2]&63)<<6) | (s[3]&63);
|
|
s += 4;
|
|
pos -= 4;
|
|
} else if (c >= 0xe0) { /* three bytes encoded, 16 bits */
|
|
c = ((s[0]&63)<<12) | ((s[1]&63)<<6) | (s[2]&63);
|
|
s += 3;
|
|
pos -= 3;
|
|
} else if (c >= 0xc0) { /* two bytes encoded, 11 bits */
|
|
c = ((s[0]&63)<<6) | (s[1]&63);
|
|
s += 2;
|
|
pos -= 2;
|
|
} else {
|
|
s++;
|
|
pos--;
|
|
}
|
|
newbuf[*newlen] = decoder ? decoder(c) : c;
|
|
++*newlen;
|
|
}
|
|
if (*newlen < len) {
|
|
newbuf = erealloc(newbuf, *newlen + 1);
|
|
}
|
|
newbuf[*newlen] = '\0';
|
|
return newbuf;
|
|
}
|
|
/* }}} */
|
|
/* {{{ php3i_xmlcharpval() */
|
|
|
|
static pval *php3i_xmlcharpval(const XML_Char *s, int len, const XML_Char *encoding)
|
|
{
|
|
pval *ret = emalloc(sizeof(pval));
|
|
|
|
if (s == NULL) {
|
|
var_reset(ret);
|
|
return ret;
|
|
}
|
|
if (len == 0) {
|
|
len = php3i_xmlcharlen(s);
|
|
}
|
|
ret->type = IS_STRING;
|
|
ret->value.str.val = xml_utf8_decode(s, len, &ret->value.str.len, encoding);
|
|
return ret;
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xmlcharlen() */
|
|
|
|
/* Count the XML_Char units in `s` before its zero terminator. */
static int php3i_xmlcharlen(const XML_Char *s)
{
	const XML_Char *end = s;

	while (*end) {
		end++;
	}
	return (int) (end - s);
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_pval_strdup() */
|
|
|
|
/* Return a newly emalloc()'d, NUL-terminated copy of the string held in
 * `val`, or NULL when `val` is not a string pval. */
PHPAPI char *php3i_pval_strdup(pval *val)
{
	char *copy;
	int length;

	if (val->type != IS_STRING) {
		return NULL;
	}

	length = val->value.str.len;
	copy = emalloc(length + 1);
	memcpy(copy, val->value.str.val, length);
	copy[length] = '\0';
	return copy;
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_add_to_info */
|
|
/* Append parser->curtag to the list stored under `name` in the parser's
 * info array, creating that list on first use, and then increment
 * parser->curtag. Does nothing when the parser has no info array. */
static void php3i_add_to_info(xml_parser *parser,char *name)
{
	pval **slot;
	unsigned int key_size;

	if (parser->info == NULL) {
		return;
	}

	/* Hash keys include the terminating NUL. */
	key_size = strlen(name) + 1;

	if (zend_hash_find(parser->info->value.ht, name, key_size, (void **) &slot) == FAILURE) {
		pval *list = emalloc(sizeof(pval));

		if (array_init(list) == FAILURE) {
			php_error(E_ERROR, "Unable to initialize array");
			return;
		}
		INIT_PZVAL(list);

		zend_hash_update(parser->info->value.ht, name, key_size, (void *) &list, sizeof(pval*), (void **) &slot);
	}

	add_next_index_long(*slot, parser->curtag);
	parser->curtag++;
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_startElementHandler() */
|
|
|
|
void php3i_xml_startElementHandler(void *userData, const char *name,
|
|
const char **attributes)
|
|
{
|
|
xml_parser *parser = (xml_parser *)userData;
|
|
const char **attrs = attributes;
|
|
|
|
if (parser) {
|
|
pval *retval, *args[3];
|
|
|
|
parser->level++;
|
|
|
|
if (parser->case_folding) {
|
|
name = _php3_strtoupper(estrdup(name));
|
|
}
|
|
|
|
if (parser->startElementHandler) {
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_string_pval(name);
|
|
MAKE_STD_ZVAL(args[2]);
|
|
array_init(args[2]);
|
|
while (attributes && *attributes) {
|
|
char *key = (char *)attributes[0];
|
|
char *value = (char *)attributes[1];
|
|
char *decoded_value;
|
|
int decoded_len;
|
|
if (parser->case_folding) {
|
|
key = _php3_strtoupper(estrdup(key));
|
|
}
|
|
decoded_value = xml_utf8_decode(value, strlen(value),
|
|
&decoded_len,
|
|
parser->target_encoding);
|
|
|
|
add_assoc_stringl(args[2], key, decoded_value, decoded_len, 0);
|
|
if (parser->case_folding) {
|
|
efree(key);
|
|
}
|
|
attributes += 2;
|
|
}
|
|
|
|
if ((retval = xml_call_handler(parser, parser->startElementHandler, 3, args))) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
}
|
|
}
|
|
|
|
if (parser->data) {
|
|
pval *tag, *atr;
|
|
int atcnt = 0;
|
|
|
|
tag = emalloc(sizeof(pval));
|
|
INIT_PZVAL(tag);
|
|
|
|
atr = emalloc(sizeof(pval));
|
|
INIT_PZVAL(atr);
|
|
|
|
array_init(tag);
|
|
array_init(atr);
|
|
|
|
php3i_add_to_info(parser,((char *) name) + parser->toffset);
|
|
|
|
add_assoc_string(tag,"tag",((char *) name) + parser->toffset,1); /* cast to avoid gcc-warning */
|
|
add_assoc_string(tag,"type","open",1);
|
|
add_assoc_long(tag,"level",parser->level);
|
|
|
|
parser->ltags[parser->level-1] = estrdup(name);
|
|
parser->lastwasopen = 1;
|
|
|
|
attributes = attrs;
|
|
while (attributes && *attributes) {
|
|
char *key = (char *)attributes[0];
|
|
char *value = (char *)attributes[1];
|
|
char *decoded_value;
|
|
int decoded_len;
|
|
if (parser->case_folding) {
|
|
key = _php3_strtoupper(estrdup(key));
|
|
}
|
|
decoded_value = xml_utf8_decode(value, strlen(value),
|
|
&decoded_len,
|
|
parser->target_encoding);
|
|
|
|
add_assoc_stringl(atr,key,decoded_value,decoded_len,0);
|
|
atcnt++;
|
|
if (parser->case_folding) {
|
|
efree(key);
|
|
}
|
|
attributes += 2;
|
|
}
|
|
|
|
if (atcnt) {
|
|
zend_hash_add(tag->value.ht,"attributes",sizeof("attributes"),&atr,sizeof(pval*),NULL);
|
|
} else {
|
|
zval_dtor(atr);
|
|
efree(atr);
|
|
}
|
|
|
|
zend_hash_next_index_insert(parser->data->value.ht,&tag,sizeof(pval*),(void *) &parser->ctag);
|
|
}
|
|
|
|
if (parser->case_folding) {
|
|
efree((char *)name);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_endElementHandler() */
|
|
|
|
void php3i_xml_endElementHandler(void *userData, const char *name)
|
|
{
|
|
xml_parser *parser = (xml_parser *)userData;
|
|
|
|
if (parser) {
|
|
pval *retval, *args[2];
|
|
|
|
if (parser->case_folding) {
|
|
name = _php3_strtoupper(estrdup(name));
|
|
}
|
|
|
|
if (parser->endElementHandler) {
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_string_pval(name);
|
|
|
|
if ((retval = xml_call_handler(parser, parser->endElementHandler, 2, args))) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
}
|
|
}
|
|
|
|
if (parser->data) {
|
|
pval *tag;
|
|
|
|
if (parser->lastwasopen) {
|
|
add_assoc_string(*(parser->ctag),"type","complete",1);
|
|
} else {
|
|
tag = emalloc(sizeof(pval));
|
|
|
|
array_init(tag);
|
|
INIT_PZVAL(tag);
|
|
|
|
php3i_add_to_info(parser,((char *) name) + parser->toffset);
|
|
|
|
add_assoc_string(tag,"tag",((char *) name) + parser->toffset,1); /* cast to avoid gcc-warning */
|
|
add_assoc_string(tag,"type","close",1);
|
|
add_assoc_long(tag,"level",parser->level);
|
|
|
|
zend_hash_next_index_insert(parser->data->value.ht,&tag,sizeof(pval*),NULL);
|
|
}
|
|
|
|
parser->lastwasopen = 0;
|
|
}
|
|
|
|
if (parser->case_folding) {
|
|
efree((char *)name);
|
|
}
|
|
if (parser->ltags) {
|
|
efree(parser->ltags[parser->level-1]);
|
|
}
|
|
parser->level--;
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_characterDataHandler() */
|
|
|
|
void php3i_xml_characterDataHandler(void *userData, const XML_Char *s, int len)
|
|
{
|
|
xml_parser *parser = (xml_parser *)userData;
|
|
|
|
if (parser) {
|
|
pval *retval, *args[2];
|
|
|
|
if (parser->characterDataHandler) {
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_xmlcharpval(s, len, parser->target_encoding);
|
|
if ((retval = xml_call_handler(parser, parser->characterDataHandler, 2, args))) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
}
|
|
}
|
|
|
|
if (parser->data) {
|
|
int i;
|
|
int doprint = 0;
|
|
|
|
char *decoded_value;
|
|
int decoded_len;
|
|
|
|
decoded_value = xml_utf8_decode(s,len,&decoded_len,parser->target_encoding);
|
|
for (i = 0; i < decoded_len; i++) {
|
|
switch (decoded_value[i]) {
|
|
case ' ':
|
|
case '\t':
|
|
case '\n':
|
|
continue;
|
|
default:
|
|
doprint = 1;
|
|
break;
|
|
}
|
|
if (doprint) {
|
|
break;
|
|
}
|
|
}
|
|
if (doprint || (! parser->skipwhite)) {
|
|
if (parser->lastwasopen) {
|
|
add_assoc_string(*(parser->ctag),"value",decoded_value,0);
|
|
} else {
|
|
pval *tag;
|
|
|
|
tag = emalloc(sizeof(pval));
|
|
|
|
array_init(tag);
|
|
|
|
php3i_add_to_info(parser,parser->ltags[parser->level-1] + parser->toffset);
|
|
|
|
add_assoc_string(tag,"tag",parser->ltags[parser->level-1] + parser->toffset,1);
|
|
add_assoc_string(tag,"value",decoded_value,0);
|
|
add_assoc_string(tag,"type","cdata",1);
|
|
add_assoc_long(tag,"level",parser->level);
|
|
|
|
zend_hash_next_index_insert(parser->data->value.ht,&tag,sizeof(pval*),NULL);
|
|
}
|
|
} else {
|
|
efree(decoded_value);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_processingInstructionHandler() */
|
|
|
|
void php3i_xml_processingInstructionHandler(void *userData,
|
|
const XML_Char *target,
|
|
const XML_Char *data)
|
|
{
|
|
xml_parser *parser = (xml_parser *)userData;
|
|
|
|
if (parser && parser->processingInstructionHandler) {
|
|
pval *retval, *args[3];
|
|
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_xmlcharpval(target, 0, parser->target_encoding);
|
|
args[2] = php3i_xmlcharpval(data, 0, parser->target_encoding);
|
|
if ((retval = xml_call_handler(parser, parser->processingInstructionHandler, 3, args))) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_defaultHandler() */
|
|
|
|
void php3i_xml_defaultHandler(void *userData, const XML_Char *s, int len)
|
|
{
|
|
xml_parser *parser = (xml_parser *)userData;
|
|
|
|
if (parser && parser->defaultHandler) {
|
|
pval *retval, *args[2];
|
|
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_xmlcharpval(s, len, parser->target_encoding);
|
|
if ((retval = xml_call_handler(parser, parser->defaultHandler, 2, args))) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_unparsedEntityDeclHandler() */
|
|
|
|
void php3i_xml_unparsedEntityDeclHandler(void *userData,
|
|
const XML_Char *entityName,
|
|
const XML_Char *base,
|
|
const XML_Char *systemId,
|
|
const XML_Char *publicId,
|
|
const XML_Char *notationName)
|
|
{
|
|
xml_parser *parser = (xml_parser *)userData;
|
|
|
|
if (parser && parser->unparsedEntityDeclHandler) {
|
|
pval *retval, *args[5];
|
|
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_xmlcharpval(entityName, 0, parser->target_encoding);
|
|
args[2] = php3i_xmlcharpval(base, 0, parser->target_encoding);
|
|
args[3] = php3i_xmlcharpval(systemId, 0, parser->target_encoding);
|
|
args[4] = php3i_xmlcharpval(publicId, 0, parser->target_encoding);
|
|
args[5] = php3i_xmlcharpval(notationName, 0, parser->target_encoding);
|
|
if ((retval = xml_call_handler(parser, parser->unparsedEntityDeclHandler, 6, args))) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_notationDeclHandler() */
|
|
|
|
void
|
|
php3i_xml_notationDeclHandler(void *userData,
|
|
const XML_Char *notationName,
|
|
const XML_Char *base,
|
|
const XML_Char *systemId,
|
|
const XML_Char *publicId)
|
|
{
|
|
xml_parser *parser = (xml_parser *)userData;
|
|
|
|
if (parser && parser->notationDeclHandler) {
|
|
pval *retval, *args[5];
|
|
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_xmlcharpval(notationName, 0, parser->target_encoding);
|
|
args[2] = php3i_xmlcharpval(base, 0, parser->target_encoding);
|
|
args[3] = php3i_xmlcharpval(systemId, 0, parser->target_encoding);
|
|
args[4] = php3i_xmlcharpval(publicId, 0, parser->target_encoding);
|
|
if ((retval = xml_call_handler(parser, parser->notationDeclHandler, 5, args))) {
|
|
zval_dtor(retval);
|
|
efree(retval);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ php3i_xml_externalEntityRefHandler() */
|
|
|
|
int
|
|
php3i_xml_externalEntityRefHandler(XML_Parser parserPtr,
|
|
const XML_Char *openEntityNames,
|
|
const XML_Char *base,
|
|
const XML_Char *systemId,
|
|
const XML_Char *publicId)
|
|
{
|
|
xml_parser *parser = XML_GetUserData(parserPtr);
|
|
int ret = 0; /* abort if no handler is set (should be configurable?) */
|
|
|
|
if (parser && parser->externalEntityRefHandler) {
|
|
pval *retval, *args[5];
|
|
|
|
args[0] = php3i_long_pval(parser->index);
|
|
args[1] = php3i_xmlcharpval(openEntityNames, 0, parser->target_encoding);
|
|
args[2] = php3i_xmlcharpval(base, 0, parser->target_encoding);
|
|
args[3] = php3i_xmlcharpval(systemId, 0, parser->target_encoding);
|
|
args[4] = php3i_xmlcharpval(publicId, 0, parser->target_encoding);
|
|
if ((retval = xml_call_handler(parser, parser->externalEntityRefHandler, 5, args))) {
|
|
convert_to_long(retval);
|
|
ret = retval->value.lval;
|
|
efree(retval);
|
|
} else {
|
|
ret = 0;
|
|
}
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
/* }}} */
|
|
|
|
/* }}} */
|
|
|
|
/************************* EXTENSION FUNCTIONS *************************/
|
|
|
|
/* {{{ proto int xml_parser_create()
|
|
Create an XML parser */
|
|
PHP_FUNCTION(xml_parser_create)
|
|
{
|
|
xml_parser *parser;
|
|
int argc;
|
|
pval *encodingArg = NULL;
|
|
XML_Char *encoding;
|
|
char thisfunc[] = "xml_parser_create";
|
|
XMLLS_FETCH();
|
|
|
|
argc = ARG_COUNT(ht);
|
|
|
|
if (argc > 1 || getParameters(ht, argc, &encodingArg) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
|
|
if (argc == 1) {
|
|
convert_to_string(encodingArg);
|
|
/* The supported encoding types are hardcoded here because
|
|
* we are limited to the encodings supported by expat/xmltok.
|
|
*/
|
|
if (strncasecmp(encodingArg->value.str.val, "ISO-8859-1",
|
|
encodingArg->value.str.len) == 0) {
|
|
encoding = "ISO-8859-1";
|
|
} else if (strncasecmp(encodingArg->value.str.val, "UTF-8",
|
|
encodingArg->value.str.len) == 0) {
|
|
encoding = "UTF-8";
|
|
} else if (strncasecmp(encodingArg->value.str.val, "US-ASCII",
|
|
encodingArg->value.str.len) == 0) {
|
|
encoding = "US-ASCII";
|
|
} else { /* UTF-16 not supported */
|
|
php_error(E_WARNING, "%s: unsupported source encoding \"%s\"",
|
|
thisfunc, encodingArg->value.str.val);
|
|
RETURN_FALSE;
|
|
}
|
|
} else {
|
|
encoding = XML(default_encoding);
|
|
}
|
|
|
|
parser = ecalloc(sizeof(xml_parser), 1);
|
|
parser->parser = XML_ParserCreate(encoding);
|
|
parser->target_encoding = encoding;
|
|
parser->case_folding = 1;
|
|
XML_SetUserData(parser->parser, parser);
|
|
|
|
ZEND_REGISTER_RESOURCE(return_value,parser,le_xml_parser);
|
|
parser->index = return_value->value.lval;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_set_element_handler(int pind, string shdl, string ehdl)
|
|
Set up start and end element handlers */
|
|
PHP_FUNCTION(xml_set_element_handler)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *shdl, *ehdl;
|
|
|
|
if (ARG_COUNT(ht) != 3 ||
|
|
getParameters(ht, 3, &pind, &shdl, &ehdl) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(shdl);
|
|
convert_to_string(ehdl);
|
|
|
|
xml_set_handler(&parser->startElementHandler, shdl);
|
|
xml_set_handler(&parser->endElementHandler, ehdl);
|
|
XML_SetElementHandler(parser->parser, php3i_xml_startElementHandler, php3i_xml_endElementHandler);
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_set_character_data_handler(int pind, string hdl)
|
|
Set up character data handler */
|
|
PHP_FUNCTION(xml_set_character_data_handler)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *hdl;
|
|
|
|
if (ARG_COUNT(ht) != 2 || getParameters(ht, 2, &pind, &hdl) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(hdl);
|
|
|
|
xml_set_handler(&parser->characterDataHandler, hdl);
|
|
XML_SetCharacterDataHandler(parser->parser, php3i_xml_characterDataHandler);
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_set_processing_instruction_handler(int pind, string hdl)
|
|
Set up processing instruction (PI) handler */
|
|
PHP_FUNCTION(xml_set_processing_instruction_handler)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *hdl;
|
|
|
|
if (ARG_COUNT(ht) != 2 || getParameters(ht, 2, &pind, &hdl) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(hdl);
|
|
|
|
xml_set_handler(&parser->processingInstructionHandler, hdl);
|
|
XML_SetProcessingInstructionHandler(parser->parser, php3i_xml_processingInstructionHandler);
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_set_default_handler(int pind, string hdl)
|
|
Set up default handler */
|
|
PHP_FUNCTION(xml_set_default_handler)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *hdl;
|
|
|
|
if (ARG_COUNT(ht) != 2 || getParameters(ht, 2, &pind, &hdl) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(hdl);
|
|
|
|
xml_set_handler(&parser->defaultHandler, hdl);
|
|
XML_SetDefaultHandler(parser->parser, php3i_xml_defaultHandler);
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_set_unparsed_entity_decl_handler(int pind, string hdl)
|
|
Set up unparsed entity declaration handler */
|
|
PHP_FUNCTION(xml_set_unparsed_entity_decl_handler)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *hdl;
|
|
|
|
if (ARG_COUNT(ht) != 2 || getParameters(ht, 2, &pind, &hdl) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(hdl);
|
|
|
|
xml_set_handler(&parser->unparsedEntityDeclHandler, hdl);
|
|
XML_SetUnparsedEntityDeclHandler(parser->parser, php3i_xml_unparsedEntityDeclHandler);
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_set_notation_decl_handler(int pind, string hdl)
|
|
Set up notation declaration handler */
|
|
PHP_FUNCTION(xml_set_notation_decl_handler)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *hdl;
|
|
|
|
if (ARG_COUNT(ht) != 2 || getParameters(ht, 2, &pind, &hdl) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(hdl);
|
|
|
|
xml_set_handler(&parser->notationDeclHandler, hdl);
|
|
XML_SetNotationDeclHandler(parser->parser, php3i_xml_notationDeclHandler);
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_set_external_entity_ref_handler(int pind, string hdl)
|
|
Set up external entity reference handler */
|
|
PHP_FUNCTION(xml_set_external_entity_ref_handler)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *hdl;
|
|
|
|
if (ARG_COUNT(ht) != 2 || getParameters(ht, 2, &pind, &hdl) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(hdl);
|
|
|
|
xml_set_handler(&parser->externalEntityRefHandler, hdl);
|
|
XML_SetExternalEntityRefHandler(parser->parser, php3i_xml_externalEntityRefHandler);
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_parse(int pind, string data[, int isFinal])
|
|
Start parsing an XML document */
|
|
PHP_FUNCTION(xml_parse)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *data, *final;
|
|
int argc, isFinal, ret;
|
|
|
|
argc = ARG_COUNT(ht);
|
|
if (argc < 2 || argc > 3 || getParameters(ht, argc, &pind, &data, &final) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(data);
|
|
|
|
if (argc == 3) {
|
|
convert_to_long(final);
|
|
isFinal = final->value.lval;
|
|
} else {
|
|
isFinal = 0;
|
|
}
|
|
|
|
ret = XML_Parse(parser->parser, data->value.str.val, data->value.str.len, isFinal);
|
|
RETVAL_LONG(ret);
|
|
}
|
|
|
|
/* }}} */
|
|
/* {{{ proto int xml_parse_into_struct(int pind, string data,array &struct,array &index)
|
|
Parsing a XML document */
|
|
|
|
PHP_FUNCTION(xml_parse_into_struct)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *data, *xdata,*info = 0;
|
|
int argc, ret;
|
|
|
|
argc = ARG_COUNT(ht);
|
|
if (getParameters(ht, 4, &pind, &data, &xdata,&info) == SUCCESS) {
|
|
if (!ParameterPassedByReference(ht, 4)) {
|
|
php_error(E_WARNING, "Array to be filled with values must be passed by reference.");
|
|
RETURN_FALSE;
|
|
}
|
|
array_init(info);
|
|
} else if (getParameters(ht, 3, &pind, &data, &xdata) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
|
|
if (!ParameterPassedByReference(ht, 3)) {
|
|
php_error(E_WARNING, "Array to be filled with values must be passed by reference.");
|
|
RETURN_FALSE;
|
|
}
|
|
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_string(data);
|
|
array_init(xdata);
|
|
|
|
parser->data = xdata;
|
|
parser->info = info;
|
|
parser->level = 0;
|
|
parser->ltags = emalloc(XML_MAXLEVEL * sizeof(char *));
|
|
|
|
XML_SetDefaultHandler(parser->parser, php3i_xml_defaultHandler);
|
|
XML_SetElementHandler(parser->parser, php3i_xml_startElementHandler, php3i_xml_endElementHandler);
|
|
XML_SetCharacterDataHandler(parser->parser, php3i_xml_characterDataHandler);
|
|
|
|
ret = XML_Parse(parser->parser, data->value.str.val, data->value.str.len, 1);
|
|
|
|
RETVAL_LONG(ret);
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_get_error_code(int pind)
|
|
Get XML parser error code */
|
|
PHP_FUNCTION(xml_get_error_code)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &pind) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
RETVAL_LONG((long)XML_GetErrorCode(parser->parser));
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto string xml_error_string(int code)
|
|
Get XML parser error string */
|
|
PHP_FUNCTION(xml_error_string)
|
|
{
|
|
pval *code;
|
|
char *str;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &code) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
convert_to_long(code);
|
|
str = (char *)XML_ErrorString((int)code->value.lval);
|
|
if (str) {
|
|
RETVAL_STRING(str, 1);
|
|
}
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_get_current_line_number(int pind)
|
|
Get current line number for an XML parser */
|
|
PHP_FUNCTION(xml_get_current_line_number)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &pind) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
RETVAL_LONG(XML_GetCurrentLineNumber(parser->parser));
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_get_current_column_number(int pind)
|
|
Get current column number for an XML parser
|
|
*/
|
|
PHP_FUNCTION(xml_get_current_column_number)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &pind) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
RETVAL_LONG(XML_GetCurrentColumnNumber(parser->parser));
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_get_current_byte_index(int pind)
|
|
Get current byte index for an XML parser */
|
|
PHP_FUNCTION(xml_get_current_byte_index)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &pind) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
RETVAL_LONG(XML_GetCurrentByteIndex(parser->parser));
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_parser_free(int pind)
|
|
Free an XML parser */
|
|
PHP_FUNCTION(xml_parser_free)
|
|
{
|
|
pval *pind;
|
|
xml_parser *parser;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &pind) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
if (php3_list_delete(parser->index) == FAILURE) {
|
|
RETURN_FALSE;
|
|
}
|
|
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_parser_set_option(int pind, int option, mixed value)
|
|
Set options in an XML parser */
|
|
PHP_FUNCTION(xml_parser_set_option)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *opt, *val;
|
|
char thisfunc[] = "xml_parser_set_option";
|
|
|
|
if (ARG_COUNT(ht) != 3 || getParameters(ht, 3, &pind, &opt, &val) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_long(opt);
|
|
|
|
switch (opt->value.lval) {
|
|
case PHP3_XML_OPTION_CASE_FOLDING:
|
|
convert_to_long(val);
|
|
parser->case_folding = val->value.lval;
|
|
break;
|
|
case PHP3_XML_OPTION_SKIP_TAGSTART:
|
|
convert_to_long(val);
|
|
parser->toffset = val->value.lval;
|
|
break;
|
|
case PHP3_XML_OPTION_SKIP_WHITE:
|
|
convert_to_long(val);
|
|
parser->skipwhite = val->value.lval;
|
|
break;
|
|
case PHP3_XML_OPTION_TARGET_ENCODING: {
|
|
xml_encoding *enc = xml_get_encoding(val->value.str.val);
|
|
if (enc == NULL) {
|
|
php_error(E_WARNING, "%s: unsupported target encoding \"%s\"",
|
|
thisfunc, val->value.str.val);
|
|
RETURN_FALSE;
|
|
}
|
|
parser->target_encoding = enc->name;
|
|
break;
|
|
}
|
|
default:
|
|
php_error(E_WARNING, "%s: unknown option", thisfunc);
|
|
RETURN_FALSE;
|
|
break;
|
|
}
|
|
RETVAL_TRUE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto int xml_parser_get_option(int pind, int option)
|
|
Get options from an XML parser */
|
|
PHP_FUNCTION(xml_parser_get_option)
|
|
{
|
|
xml_parser *parser;
|
|
pval *pind, *opt;
|
|
char thisfunc[] = "xml_parser_get_option";
|
|
|
|
if (ARG_COUNT(ht) != 2 || getParameters(ht, 2, &pind, &opt) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
|
|
|
|
convert_to_long(opt);
|
|
|
|
switch (opt->value.lval) {
|
|
case PHP3_XML_OPTION_CASE_FOLDING:
|
|
RETURN_LONG(parser->case_folding);
|
|
break;
|
|
case PHP3_XML_OPTION_TARGET_ENCODING:
|
|
RETURN_STRING(parser->target_encoding, 1);
|
|
break;
|
|
default:
|
|
php_error(E_WARNING, "%s: unknown option", thisfunc);
|
|
RETURN_FALSE;
|
|
break;
|
|
}
|
|
RETVAL_FALSE;
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto string utf8_encode(string data)
|
|
Encodes an ISO-8859-1 string to UTF-8 */
|
|
PHP_FUNCTION(utf8_encode)
|
|
{
|
|
pval *arg;
|
|
XML_Char *encoded;
|
|
int len;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &arg) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
convert_to_string(arg);
|
|
encoded = xml_utf8_encode(arg->value.str.val, arg->value.str.len, &len, "ISO-8859-1");
|
|
if (encoded == NULL) {
|
|
RETURN_FALSE;
|
|
}
|
|
RETVAL_STRINGL(encoded, len, 0);
|
|
}
|
|
/* }}} */
|
|
|
|
/* {{{ proto string utf8_decode(string data)
|
|
Converts a UTF-8 encoded string to ISO-8859-1 */
|
|
PHP_FUNCTION(utf8_decode)
|
|
{
|
|
pval *arg;
|
|
XML_Char *decoded;
|
|
int len;
|
|
|
|
if (ARG_COUNT(ht) != 1 || getParameters(ht, 1, &arg) == FAILURE) {
|
|
WRONG_PARAM_COUNT;
|
|
}
|
|
convert_to_string(arg);
|
|
decoded = xml_utf8_decode(arg->value.str.val, arg->value.str.len, &len, "ISO-8859-1");
|
|
if (decoded == NULL) {
|
|
RETURN_FALSE;
|
|
}
|
|
RETVAL_STRINGL(decoded, len, 0);
|
|
}
|
|
/* }}} */
|
|
|
|
#endif
|
|
|
|
/*
|
|
* Local variables:
|
|
* tab-width: 4
|
|
* c-basic-offset: 4
|
|
* End:
|
|
*/
|