mirror of
https://github.com/jerryscript-project/jerryscript.git
synced 2025-12-15 16:29:21 +00:00
* Fix "end of file while inside a group" doxygen warnings. * Fix "unknown command" doxygen warnings caused by incorrect argument references. Instead of `@foo`, `@a foo` is the proper format. * Fix "unknown command" doxygen warnings caused by incorrect parameter direction specifications. Instead of `@in`, `@out`, and `@in-out`, `[in]`, `[out]`, and `[in,out]` are the proper formats. * Wrapping special characters in quotes to avoid doxygen confusion. Raw pipe, semicolon, dot, backslash, etc. characters can drive doxygen into various misinterpretations and warnings. E.g.: ``` End of list marker found without any preceding list items Found unknown command ``` Putting quotes around such text snipets eliminates the errors. * Fix the documentation of `ecma_builtin_global_object_print`. Raw <> and \ sequences confused doxygen in various ways (it tried to interpret them as XML tags and doxygen commands). * Fix "ignoring title that does not match old title" doxygen warnings. At some places, the group titles were out of sync, at others, the group names were incorrect. * Fix "parameters are not documented" doxygen warnings. Fixing various typos in the inline parameter documentations (`/*`, `/**`, `/** <`, and `/**>` are all considered incorrect, the right format is `/**<`). JerryScript-DCO-1.0-Signed-off-by: Akos Kiss akiss@inf.u-szeged.hu
131 lines
4.7 KiB
C
131 lines
4.7 KiB
C
/* Copyright 2015-2016 Samsung Electronics Co., Ltd.
|
|
* Copyright 2015-2016 University of Szeged.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#ifndef RE_COMPILER_H
|
|
#define RE_COMPILER_H
|
|
|
|
#ifndef CONFIG_ECMA_COMPACT_PROFILE_DISABLE_REGEXP_BUILTIN
|
|
|
|
#include "ecma-globals.h"
|
|
#include "re-parser.h"
|
|
|
|
/** \addtogroup parser Parser
|
|
* @{
|
|
*
|
|
* \addtogroup regexparser Regular expression
|
|
* @{
|
|
*
|
|
* \addtogroup regexparser_compiler Compiler
|
|
* @{
|
|
*/
|
|
|
|
/**
|
|
* RegExp opcodes
|
|
*/
|
|
typedef enum
|
|
{
|
|
RE_OP_EOF,
|
|
/* Group opcode order is important, because RE_IS_CAPTURE_GROUP is based on it.
|
|
* Change it carefully. Capture opcodes should be at first.
|
|
*/
|
|
RE_OP_CAPTURE_GROUP_START, /**< group start */
|
|
RE_OP_CAPTURE_GREEDY_ZERO_GROUP_START, /**< greedy zero group start */
|
|
RE_OP_CAPTURE_NON_GREEDY_ZERO_GROUP_START, /**< non-greedy zero group start */
|
|
RE_OP_CAPTURE_GREEDY_GROUP_END, /**< greedy group end */
|
|
RE_OP_CAPTURE_NON_GREEDY_GROUP_END, /**< non-greedy group end */
|
|
RE_OP_NON_CAPTURE_GROUP_START, /**< non-capture group start */
|
|
RE_OP_NON_CAPTURE_GREEDY_ZERO_GROUP_START, /**< non-capture greedy zero group start */
|
|
RE_OP_NON_CAPTURE_NON_GREEDY_ZERO_GROUP_START, /**< non-capture non-greedy zero group start */
|
|
RE_OP_NON_CAPTURE_GREEDY_GROUP_END, /**< non-capture greedy group end */
|
|
RE_OP_NON_CAPTURE_NON_GREEDY_GROUP_END, /**< non-capture non-greedy group end */
|
|
|
|
RE_OP_MATCH, /**< match */
|
|
RE_OP_CHAR, /**< any character */
|
|
RE_OP_SAVE_AT_START, /**< save at start */
|
|
RE_OP_SAVE_AND_MATCH, /**< save and match */
|
|
RE_OP_PERIOD, /**< "." */
|
|
RE_OP_ALTERNATIVE, /**< "|" */
|
|
RE_OP_GREEDY_ITERATOR, /**< greedy iterator */
|
|
RE_OP_NON_GREEDY_ITERATOR, /**< non-greedy iterator */
|
|
RE_OP_ASSERT_START, /**< "^" */
|
|
RE_OP_ASSERT_END, /**< "$" */
|
|
RE_OP_ASSERT_WORD_BOUNDARY, /**< "\b" */
|
|
RE_OP_ASSERT_NOT_WORD_BOUNDARY, /**< "\B" */
|
|
RE_OP_LOOKAHEAD_POS, /**< lookahead pos */
|
|
RE_OP_LOOKAHEAD_NEG, /**< lookahead neg */
|
|
RE_OP_BACKREFERENCE, /**< \[0..9] */
|
|
RE_OP_CHAR_CLASS, /**< [ ] */
|
|
RE_OP_INV_CHAR_CLASS /**< [^ ] */
|
|
} re_opcode_t;
|
|
|
|
/**
|
|
* Compiled byte code data.
|
|
*/
|
|
typedef struct
|
|
{
|
|
uint16_t flags; /**< RegExp flags */
|
|
mem_cpointer_t pattern_cp; /**< original RegExp pattern */
|
|
uint32_t num_of_captures; /**< number of capturing brackets */
|
|
uint32_t num_of_non_captures; /**< number of non capturing brackets */
|
|
} re_compiled_code_t;
|
|
|
|
/**
|
|
* Check if a RegExp opcode is a capture group or not
|
|
*/
|
|
#define RE_IS_CAPTURE_GROUP(x) (((x) < RE_OP_NON_CAPTURE_GROUP_START) ? 1 : 0)
|
|
|
|
/**
|
|
* Context of RegExp bytecode container
|
|
*/
|
|
typedef struct
|
|
{
|
|
uint8_t *block_start_p; /**< start of bytecode block */
|
|
uint8_t *block_end_p; /**< end of bytecode block */
|
|
uint8_t *current_p; /**< current position in bytecode */
|
|
} re_bytecode_ctx_t;
|
|
|
|
/**
|
|
* Context of RegExp compiler
|
|
*/
|
|
typedef struct
|
|
{
|
|
uint16_t flags; /**< RegExp flags */
|
|
uint32_t num_of_captures; /**< number of capture groups */
|
|
uint32_t num_of_non_captures; /**< number of non-capture groups */
|
|
uint32_t highest_backref; /**< highest backreference */
|
|
re_bytecode_ctx_t *bytecode_ctx_p; /**< pointer of RegExp bytecode context */
|
|
re_token_t current_token; /**< current token */
|
|
re_parser_ctx_t *parser_ctx_p; /**< pointer of RegExp parser context */
|
|
} re_compiler_ctx_t;
|
|
|
|
ecma_completion_value_t
|
|
re_compile_bytecode (re_compiled_code_t **, ecma_string_t *, uint16_t);
|
|
|
|
re_opcode_t
|
|
re_get_opcode (uint8_t **);
|
|
|
|
uint32_t
|
|
re_get_value (uint8_t **);
|
|
|
|
/**
|
|
* @}
|
|
* @}
|
|
* @}
|
|
*/
|
|
|
|
#endif /* !CONFIG_ECMA_COMPACT_PROFILE_DISABLE_REGEXP_BUILTIN */
|
|
#endif /* !RE_COMPILER_H */
|