1999-04-08 02:10:10 +08:00
|
|
|
/*
|
|
|
|
+----------------------------------------------------------------------+
|
|
|
|
| Zend Engine |
|
|
|
|
+----------------------------------------------------------------------+
|
2019-01-30 17:23:29 +08:00
|
|
|
| Copyright (c) Zend Technologies Ltd. (http://www.zend.com) |
|
1999-04-08 02:10:10 +08:00
|
|
|
+----------------------------------------------------------------------+
|
2001-12-11 23:16:21 +08:00
|
|
|
| This source file is subject to version 2.00 of the Zend license, |
|
2015-01-03 17:22:58 +08:00
|
|
|
| that is bundled with this package in the file LICENSE, and is |
|
2003-06-11 04:04:29 +08:00
|
|
|
| available through the world-wide-web at the following url: |
|
2001-12-11 23:16:21 +08:00
|
|
|
| http://www.zend.com/license/2_00.txt. |
|
1999-07-16 22:58:16 +08:00
|
|
|
| If you did not receive a copy of the Zend license and are unable to |
|
|
|
|
| obtain it through the world-wide-web, please send a note to |
|
|
|
|
| license@zend.com so we can mail you a copy immediately. |
|
1999-04-08 02:10:10 +08:00
|
|
|
+----------------------------------------------------------------------+
|
2018-11-01 23:20:07 +08:00
|
|
|
| Authors: Andi Gutmans <andi@php.net> |
|
|
|
|
| Zeev Suraski <zeev@php.net> |
|
1999-04-08 02:10:10 +08:00
|
|
|
+----------------------------------------------------------------------+
|
|
|
|
*/
|
|
|
|
|
2000-07-03 08:55:36 +08:00
|
|
|
#ifndef ZEND_SCANNER_H
|
|
|
|
#define ZEND_SCANNER_H
|
1999-04-08 02:10:10 +08:00
|
|
|
|
1999-05-23 00:10:51 +08:00
|
|
|
typedef struct _zend_lex_state {
|
2008-03-17 05:06:55 +08:00
|
|
|
unsigned int yy_leng;
|
|
|
|
unsigned char *yy_start;
|
|
|
|
unsigned char *yy_text;
|
|
|
|
unsigned char *yy_cursor;
|
|
|
|
unsigned char *yy_marker;
|
|
|
|
unsigned char *yy_limit;
|
|
|
|
int yy_state;
|
|
|
|
zend_stack state_stack;
|
2012-03-31 02:41:44 +08:00
|
|
|
zend_ptr_stack heredoc_label_stack;
|
Syntax errors caused by unclosed {, [, ( mention specific location
Aside from a few very specific syntax errors for which detailed exceptions are
thrown, generally PHP just emits the default error messages generated by bison on syntax
error. These messages are very uninformative; they just say "Unexpected ... at line ...".
This is most problematic with constructs which can span an arbitrary number of lines, such
as blocks of code delimited by { }, 'if' conditions delimited by ( ), and so on. If a closing
delimiter is missed, the block will run for the entire remainder of the source file (which
could be thousands of lines), and then at the end, a parse error will be thrown with the
dreaded words: "Unexpected end of file".
Therefore, track the positions of opening and closing delimiters and ensure that they match
up correctly. If any mismatch or missing delimiter is detected, immediately throw a parse
error which points the user to the offending line. This is best done in the *lexer* and not
in the parser.
Thanks to Nikita Popov and George Peter Banyard for suggesting improvements.
Fixes bug #79368.
Closes GH-5364.
2020-04-08 19:19:39 +08:00
|
|
|
zend_stack nest_location_stack; /* for syntax error reporting */
|
2008-03-17 05:06:55 +08:00
|
|
|
|
2003-02-18 17:37:54 +08:00
|
|
|
zend_file_handle *in;
|
2016-11-26 22:18:42 +08:00
|
|
|
uint32_t lineno;
|
2014-02-10 14:04:30 +08:00
|
|
|
zend_string *filename;
|
2008-06-29 16:21:35 +08:00
|
|
|
|
|
|
|
/* original (unfiltered) script */
|
2008-07-25 06:21:41 +08:00
|
|
|
unsigned char *script_org;
|
|
|
|
size_t script_org_size;
|
2008-06-29 16:21:35 +08:00
|
|
|
|
|
|
|
/* filtered script */
|
2008-07-25 06:21:41 +08:00
|
|
|
unsigned char *script_filtered;
|
|
|
|
size_t script_filtered_size;
|
2008-06-29 16:21:35 +08:00
|
|
|
|
2013-07-24 07:55:43 +08:00
|
|
|
/* input/output filters */
|
2008-06-29 16:21:35 +08:00
|
|
|
zend_encoding_filter input_filter;
|
|
|
|
zend_encoding_filter output_filter;
|
2010-12-20 00:36:37 +08:00
|
|
|
const zend_encoding *script_encoding;
|
2015-01-23 01:39:34 +08:00
|
|
|
|
2015-04-05 19:50:35 +08:00
|
|
|
/* hooks */
|
2020-06-05 22:55:20 +08:00
|
|
|
void (*on_event)(
|
|
|
|
zend_php_scanner_event event, int token, int line,
|
|
|
|
const char *text, size_t length, void *context);
|
2016-07-23 06:00:13 +08:00
|
|
|
void *on_event_context;
|
2015-04-05 19:50:35 +08:00
|
|
|
|
2015-01-23 01:39:34 +08:00
|
|
|
zend_ast *ast;
|
|
|
|
zend_arena *ast_arena;
|
2000-06-17 22:12:58 +08:00
|
|
|
} zend_lex_state;
|
|
|
|
|
2012-03-31 02:41:44 +08:00
|
|
|
typedef struct _zend_heredoc_label {
|
|
|
|
char *label;
|
|
|
|
int length;
|
2017-09-15 21:07:59 +08:00
|
|
|
int indentation;
|
2021-01-15 19:30:54 +08:00
|
|
|
bool indentation_uses_spaces;
|
2012-03-31 02:41:44 +08:00
|
|
|
} zend_heredoc_label;
|
1999-04-08 02:10:10 +08:00
|
|
|
|
Syntax errors caused by unclosed {, [, ( mention specific location
Aside from a few very specific syntax errors for which detailed exceptions are
thrown, generally PHP just emits the default error messages generated by bison on syntax
error. These messages are very uninformative; they just say "Unexpected ... at line ...".
This is most problematic with constructs which can span an arbitrary number of lines, such
as blocks of code delimited by { }, 'if' conditions delimited by ( ), and so on. If a closing
delimiter is missed, the block will run for the entire remainder of the source file (which
could be thousands of lines), and then at the end, a parse error will be thrown with the
dreaded words: "Unexpected end of file".
Therefore, track the positions of opening and closing delimiters and ensure that they match
up correctly. If any mismatch or missing delimiter is detected, immediately throw a parse
error which points the user to the offending line. This is best done in the *lexer* and not
in the parser.
Thanks to Nikita Popov and George Peter Banyard for suggesting improvements.
Fixes bug #79368.
Closes GH-5364.
2020-04-08 19:19:39 +08:00
|
|
|
/* Track locations of unclosed {, [, (, etc. for better syntax error reporting */
|
|
|
|
typedef struct _zend_nest_location {
|
|
|
|
char text;
|
|
|
|
int lineno;
|
|
|
|
} zend_nest_location;
|
|
|
|
|
1999-12-03 02:59:29 +08:00
|
|
|
BEGIN_EXTERN_C()
|
2014-12-14 06:06:14 +08:00
|
|
|
ZEND_API void zend_save_lexical_state(zend_lex_state *lex_state);
|
|
|
|
ZEND_API void zend_restore_lexical_state(zend_lex_state *lex_state);
|
2021-01-21 17:31:32 +08:00
|
|
|
ZEND_API void zend_prepare_string_for_scanning(zval *str, zend_string *filename);
|
2014-12-14 06:06:14 +08:00
|
|
|
ZEND_API void zend_multibyte_yyinput_again(zend_encoding_filter old_input_filter, const zend_encoding *old_encoding);
|
2020-08-28 21:41:27 +08:00
|
|
|
ZEND_API zend_result zend_multibyte_set_filter(const zend_encoding *onetime_encoding);
|
2021-01-25 21:36:18 +08:00
|
|
|
ZEND_API zend_result zend_lex_tstring(zval *zv, unsigned char *ident);
|
2004-01-12 03:27:13 +08:00
|
|
|
|
1999-12-03 02:59:29 +08:00
|
|
|
END_EXTERN_C()
|
1999-12-02 06:55:20 +08:00
|
|
|
|
1999-04-08 02:10:10 +08:00
|
|
|
#endif
|