Improvements related to lexer

Improvements related to lexer:

* duplicated code (clones) is eliminated
* magic numbers are replaced with constants
* functions are moved from util to lit-char-helpers

JerryScript-DCO-1.0-Signed-off-by: István Kádár ikadar@inf.u-szeged.hu
This commit is contained in:
Istvan Kadar
2016-04-14 10:26:36 +02:00
committed by Akos Kiss
parent c7dcce4fc7
commit ecfd478df0
9 changed files with 424 additions and 388 deletions
+141 -28
View File
@@ -122,7 +122,7 @@ lit_char_is_format_control (ecma_char_t c) /**< code unit */
bool bool
lit_char_is_white_space (ecma_char_t c) /**< code unit */ lit_char_is_white_space (ecma_char_t c) /**< code unit */
{ {
if (c <= 127) if (c <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
{ {
return (c == LIT_CHAR_TAB return (c == LIT_CHAR_TAB
|| c == LIT_CHAR_VTAB || c == LIT_CHAR_VTAB
@@ -172,20 +172,9 @@ lit_char_is_line_terminator (ecma_char_t c) /**< code unit */
* @return true - if specified character falls into one of the listed categories, * @return true - if specified character falls into one of the listed categories,
* false - otherwise. * false - otherwise.
*/ */
bool static bool
lit_char_is_unicode_letter (ecma_char_t c) /**< code unit */ lit_char_is_unicode_letter (ecma_char_t c) /**< code unit */
{ {
/* Fast path for ASCII-defined letters */
if ((c >= LIT_CHAR_ASCII_LOWERCASE_LETTERS_BEGIN && c <= LIT_CHAR_ASCII_LOWERCASE_LETTERS_END)
|| (c >= LIT_CHAR_ASCII_UPPERCASE_LETTERS_BEGIN && c <= LIT_CHAR_ASCII_UPPERCASE_LETTERS_END))
{
return true;
}
else if (c <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
{
return false;
}
return (search_char_in_interval_array (c, unicode_letter_interv_sps, unicode_letter_interv_lens, return (search_char_in_interval_array (c, unicode_letter_interv_sps, unicode_letter_interv_lens,
NUM_OF_ELEMENTS (unicode_letter_interv_sps)) NUM_OF_ELEMENTS (unicode_letter_interv_sps))
|| search_char_in_char_array (c, unicode_letter_chars, NUM_OF_ELEMENTS (unicode_letter_chars))); || search_char_in_char_array (c, unicode_letter_chars, NUM_OF_ELEMENTS (unicode_letter_chars)));
@@ -205,23 +194,90 @@ lit_char_is_unicode_letter (ecma_char_t c) /**< code unit */
* @return true - if specified character falls into one of the listed categories, * @return true - if specified character falls into one of the listed categories,
* false - otherwise. * false - otherwise.
*/ */
bool static bool
lit_char_is_unicode_non_letter_ident_part (ecma_char_t c) /**< code unit */ lit_char_is_unicode_non_letter_ident_part (ecma_char_t c) /**< code unit */
{ {
if (c <= 127) return (search_char_in_interval_array (c, unicode_non_letter_ident_part_interv_sps,
{ unicode_non_letter_ident_part_interv_lens,
return LIT_CHAR_ASCII_DIGITS_BEGIN <= c && c <= LIT_CHAR_ASCII_DIGITS_END; NUM_OF_ELEMENTS (unicode_non_letter_ident_part_interv_sps))
} || search_char_in_char_array (c, unicode_non_letter_ident_part_chars,
else NUM_OF_ELEMENTS (unicode_non_letter_ident_part_chars)));
{
return (search_char_in_interval_array (c, unicode_non_letter_ident_part_interv_sps,
unicode_non_letter_ident_part_interv_lens,
NUM_OF_ELEMENTS (unicode_non_letter_ident_part_interv_sps))
|| search_char_in_char_array (c, unicode_non_letter_ident_part_chars,
NUM_OF_ELEMENTS (unicode_non_letter_ident_part_chars)));
}
} /* lit_char_is_unicode_non_letter_ident_part */ } /* lit_char_is_unicode_non_letter_ident_part */
/**
 * Check whether the UTF8 character at the given position may start an identifier.
 *
 * A lead byte that does not exceed LIT_UTF8_1_BYTE_CODE_POINT_MAX is classified
 * directly; for any other lead byte the code unit is obtained through
 * lit_utf8_peek_next before it is classified.
 *
 * @return true - if lit_char_is_identifier_start_character accepts the character,
 *         false - otherwise.
 */
bool
lit_char_is_identifier_start (const uint8_t *src_p) /**< pointer to a valid UTF8 character */
{
  if (*src_p > LIT_UTF8_1_BYTE_CODE_POINT_MAX)
  {
    /* Not a single-byte character: let lit_utf8_peek_next produce the code unit. */
    return lit_char_is_identifier_start_character (lit_utf8_peek_next (src_p));
  }

  return lit_char_is_identifier_start_character (*src_p);
} /* lit_char_is_identifier_start */
/**
 * Check whether a character may start an identifier.
 *
 * Characters up to LIT_UTF8_1_BYTE_CODE_POINT_MAX are accepted when they are
 * an ASCII letter (either case), '$' or '_'. Everything above that limit is
 * delegated to lit_char_is_unicode_letter.
 *
 * @return true - if the character is a valid identifier start,
 *         false - otherwise.
 */
bool
lit_char_is_identifier_start_character (uint16_t chr) /**< EcmaScript character */
{
  if (chr > LIT_UTF8_1_BYTE_CODE_POINT_MAX)
  {
    return lit_char_is_unicode_letter (chr);
  }

  /* ASCII range: fold the case once, then compare against 'a'..'z'. */
  const uint16_t folded_chr = (uint16_t) LEXER_TO_ASCII_LOWERCASE (chr);

  if (folded_chr >= LIT_CHAR_LOWERCASE_A && folded_chr <= LIT_CHAR_LOWERCASE_Z)
  {
    return true;
  }

  return (chr == LIT_CHAR_DOLLAR_SIGN || chr == LIT_CHAR_UNDERSCORE);
} /* lit_char_is_identifier_start_character */
/**
 * Check whether the UTF8 character at the given position may continue an identifier.
 *
 * A lead byte that does not exceed LIT_UTF8_1_BYTE_CODE_POINT_MAX is classified
 * directly; for any other lead byte the code unit is obtained through
 * lit_utf8_peek_next before it is classified.
 *
 * @return true - if lit_char_is_identifier_part_character accepts the character,
 *         false - otherwise.
 */
bool
lit_char_is_identifier_part (const uint8_t *src_p) /**< pointer to a valid UTF8 character */
{
  if (*src_p > LIT_UTF8_1_BYTE_CODE_POINT_MAX)
  {
    /* Not a single-byte character: let lit_utf8_peek_next produce the code unit. */
    return lit_char_is_identifier_part_character (lit_utf8_peek_next (src_p));
  }

  return lit_char_is_identifier_part_character (*src_p);
} /* lit_char_is_identifier_part */
/**
 * Check whether a character may appear inside an identifier.
 *
 * Characters up to LIT_UTF8_1_BYTE_CODE_POINT_MAX are accepted when they are
 * an ASCII letter (either case), a decimal digit, '$' or '_'. Everything above
 * that limit is accepted when either lit_char_is_unicode_letter or
 * lit_char_is_unicode_non_letter_ident_part accepts it.
 *
 * @return true - if the character is a valid identifier part,
 *         false - otherwise.
 */
bool
lit_char_is_identifier_part_character (uint16_t chr) /**< EcmaScript character */
{
  if (chr > LIT_UTF8_1_BYTE_CODE_POINT_MAX)
  {
    return (lit_char_is_unicode_letter (chr)
            || lit_char_is_unicode_non_letter_ident_part (chr));
  }

  /* ASCII range: fold the case once, then compare against 'a'..'z'. */
  const uint16_t folded_chr = (uint16_t) LEXER_TO_ASCII_LOWERCASE (chr);
  const bool is_ascii_letter = (folded_chr >= LIT_CHAR_LOWERCASE_A && folded_chr <= LIT_CHAR_LOWERCASE_Z);
  const bool is_ascii_digit = (chr >= LIT_CHAR_0 && chr <= LIT_CHAR_9);

  return (is_ascii_letter
          || is_ascii_digit
          || chr == LIT_CHAR_DOLLAR_SIGN
          || chr == LIT_CHAR_UNDERSCORE);
} /* lit_char_is_identifier_part_character */
/** /**
* Check if specified character is one of OctalDigit characters (ECMA-262 v5, B.1.2) * Check if specified character is one of OctalDigit characters (ECMA-262 v5, B.1.2)
* *
@@ -253,8 +309,8 @@ bool
lit_char_is_hex_digit (ecma_char_t c) /**< code unit */ lit_char_is_hex_digit (ecma_char_t c) /**< code unit */
{ {
return ((c >= LIT_CHAR_ASCII_DIGITS_BEGIN && c <= LIT_CHAR_ASCII_DIGITS_END) return ((c >= LIT_CHAR_ASCII_DIGITS_BEGIN && c <= LIT_CHAR_ASCII_DIGITS_END)
|| (c >= LIT_CHAR_ASCII_LOWERCASE_LETTERS_HEX_BEGIN && c <= LIT_CHAR_ASCII_LOWERCASE_LETTERS_HEX_END) || (LEXER_TO_ASCII_LOWERCASE (c) >= LIT_CHAR_ASCII_LOWERCASE_LETTERS_HEX_BEGIN
|| (c >= LIT_CHAR_ASCII_UPPERCASE_LETTERS_HEX_BEGIN && c <= LIT_CHAR_ASCII_UPPERCASE_LETTERS_HEX_END)); && LEXER_TO_ASCII_LOWERCASE (c) <= LIT_CHAR_ASCII_LOWERCASE_LETTERS_HEX_END));
} /* lit_char_is_hex_digit */ } /* lit_char_is_hex_digit */
/** /**
@@ -282,6 +338,63 @@ lit_char_hex_to_int (ecma_char_t c) /**< code unit, corresponding to
} }
} /* lit_char_hex_to_int */ } /* lit_char_hex_to_int */
/**
 * Encode a character as UTF8 bytes into the destination buffer.
 *
 * One, two or three bytes are written starting at dst_p, so the buffer
 * must have room for up to three bytes.
 *
 * @return number of bytes written (1, 2 or 3).
 */
size_t
lit_char_to_utf8_bytes (uint8_t *dst_p, /**< destination buffer */
                        ecma_char_t chr) /**< EcmaScript character */
{
  if (chr <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
  {
    /* 00000000 0xxxxxxx -> 0xxxxxxx */
    dst_p[0] = (uint8_t) chr;
    return 1;
  }

  if (chr <= LIT_UTF8_2_BYTE_CODE_POINT_MAX)
  {
    /* 00000yyy yyxxxxxx -> 110yyyyy 10xxxxxx */
    dst_p[0] = (uint8_t) (LIT_UTF8_2_BYTE_MARKER | ((chr >> 6) & LIT_UTF8_LAST_5_BITS_MASK));
    dst_p[1] = (uint8_t) (LIT_UTF8_EXTRA_BYTE_MARKER | (chr & LIT_UTF8_LAST_6_BITS_MASK));
    return 2;
  }

  JERRY_ASSERT (!(chr & ~LIT_UTF8_3_BYTE_CODE_POINT_MAX));

  /* zzzzyyyy yyxxxxxx -> 1110zzzz 10yyyyyy 10xxxxxx */
  dst_p[0] = (uint8_t) (LIT_UTF8_3_BYTE_MARKER | ((chr >> 12) & LIT_UTF8_LAST_4_BITS_MASK));
  dst_p[1] = (uint8_t) (LIT_UTF8_EXTRA_BYTE_MARKER | ((chr >> 6) & LIT_UTF8_LAST_6_BITS_MASK));
  dst_p[2] = (uint8_t) (LIT_UTF8_EXTRA_BYTE_MARKER | (chr & LIT_UTF8_LAST_6_BITS_MASK));
  return 3;
} /* lit_char_to_utf8_bytes */
/**
 * Compute how many bytes the UTF8 representation of a character occupies.
 *
 * @return length of the UTF8 representation (1, 2 or 3).
 */
size_t
lit_char_get_utf8_length (ecma_char_t chr) /**< EcmaScript character */
{
  if (chr <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
  {
    /* 00000000 0xxxxxxx */
    return 1;
  }

  if (chr <= LIT_UTF8_2_BYTE_CODE_POINT_MAX)
  {
    /* 00000yyy yyxxxxxx */
    return 2;
  }

  /* zzzzyyyy yyxxxxxx */
  JERRY_ASSERT (!(chr & ~LIT_UTF8_3_BYTE_CODE_POINT_MAX));

  return 3;
} /* lit_char_get_utf8_length */
/** /**
* Parse the next number_of_characters hexadecimal character, * Parse the next number_of_characters hexadecimal character,
* and construct a code unit from them. The buffer must * and construct a code unit from them. The buffer must
+8 -2
View File
@@ -78,8 +78,10 @@ extern bool lit_char_is_line_terminator (ecma_char_t);
#define LIT_CHAR_UNDERSCORE ((ecma_char_t) '_') /* low line (underscore) */ #define LIT_CHAR_UNDERSCORE ((ecma_char_t) '_') /* low line (underscore) */
/* LIT_CHAR_BACKSLASH defined above */ /* LIT_CHAR_BACKSLASH defined above */
extern bool lit_char_is_unicode_letter (ecma_char_t); extern bool lit_char_is_identifier_start (const uint8_t *);
extern bool lit_char_is_unicode_non_letter_ident_part (ecma_char_t); extern bool lit_char_is_identifier_part (const uint8_t *);
extern bool lit_char_is_identifier_start_character (ecma_char_t);
extern bool lit_char_is_identifier_part_character (ecma_char_t);
/* /*
* Punctuator characters (ECMA-262 v5, 7.7) * Punctuator characters (ECMA-262 v5, 7.7)
@@ -210,10 +212,14 @@ extern bool lit_char_is_unicode_non_letter_ident_part (ecma_char_t);
#define LIT_CHAR_ASCII_DIGITS_BEGIN LIT_CHAR_0 /* decimal digits range */ #define LIT_CHAR_ASCII_DIGITS_BEGIN LIT_CHAR_0 /* decimal digits range */
#define LIT_CHAR_ASCII_DIGITS_END LIT_CHAR_9 #define LIT_CHAR_ASCII_DIGITS_END LIT_CHAR_9
#define LEXER_TO_ASCII_LOWERCASE(character) ((character) | LIT_CHAR_SP)
extern bool lit_char_is_octal_digit (ecma_char_t); extern bool lit_char_is_octal_digit (ecma_char_t);
extern bool lit_char_is_decimal_digit (ecma_char_t); extern bool lit_char_is_decimal_digit (ecma_char_t);
extern bool lit_char_is_hex_digit (ecma_char_t); extern bool lit_char_is_hex_digit (ecma_char_t);
extern uint32_t lit_char_hex_to_int (ecma_char_t); extern uint32_t lit_char_hex_to_int (ecma_char_t);
extern size_t lit_char_to_utf8_bytes (uint8_t *, ecma_char_t);
extern size_t lit_char_get_utf8_length (ecma_char_t);
/* read a hex encoded code point from a zero terminated buffer */ /* read a hex encoded code point from a zero terminated buffer */
bool lit_read_code_unit_from_hex (const lit_utf8_byte_t *, lit_utf8_size_t, ecma_char_ptr_t); bool lit_read_code_unit_from_hex (const lit_utf8_byte_t *, lit_utf8_size_t, ecma_char_ptr_t);
-127
View File
@@ -16,7 +16,6 @@
#include "common.h" #include "common.h"
#include "ecma-helpers.h" #include "ecma-helpers.h"
#include "lit-char-helpers.h"
/** \addtogroup parser Parser /** \addtogroup parser Parser
* @{ * @{
@@ -28,132 +27,6 @@
* @{ * @{
*/ */
/**
 * Check whether the UTF8 character at the given position may start an identifier.
 *
 * A lead byte up to 127 is classified directly; for any other lead byte the
 * code unit is obtained through lit_utf8_peek_next before it is classified.
 *
 * @return non-zero if util_is_identifier_start_character accepts the character.
 */
int
util_is_identifier_start (const uint8_t *src_p) /**< pointer to a valid UTF8 character */
{
  if (*src_p > 127)
  {
    /* Not a single-byte character: let lit_utf8_peek_next produce the code unit. */
    return util_is_identifier_start_character (lit_utf8_peek_next (src_p));
  }

  return util_is_identifier_start_character (*src_p);
} /* util_is_identifier_start */
/**
 * Check whether the UTF8 character at the given position may continue an identifier.
 *
 * A lead byte up to 127 is classified directly; for any other lead byte the
 * code unit is obtained through lit_utf8_peek_next before it is classified.
 *
 * @return non-zero if util_is_identifier_part_character accepts the character.
 */
int
util_is_identifier_part (const uint8_t *src_p) /**< pointer to a valid UTF8 character */
{
  if (*src_p > 127)
  {
    /* Not a single-byte character: let lit_utf8_peek_next produce the code unit. */
    return util_is_identifier_part_character (lit_utf8_peek_next (src_p));
  }

  return util_is_identifier_part_character (*src_p);
} /* util_is_identifier_part */
/**
 * Check whether a character may start an identifier.
 *
 * Characters up to 127 are accepted when they are an ASCII letter (either
 * case), '$' or '_'. Larger values are delegated to lit_char_is_unicode_letter.
 *
 * @return non-zero if the character is a valid identifier start.
 */
int
util_is_identifier_start_character (uint16_t chr) /**< EcmaScript character */
{
  if (chr > 127)
  {
    return lit_char_is_unicode_letter (chr);
  }

  /* Setting bit 0x20 maps ASCII uppercase letters onto their lowercase form. */
  const uint16_t folded_chr = (uint16_t) (chr | 0x20);

  if (folded_chr >= LIT_CHAR_LOWERCASE_A && folded_chr <= LIT_CHAR_LOWERCASE_Z)
  {
    return 1;
  }

  return (chr == LIT_CHAR_DOLLAR_SIGN || chr == LIT_CHAR_UNDERSCORE);
} /* util_is_identifier_start_character */
/**
 * Check whether a character may appear inside an identifier.
 *
 * Characters up to 127 are accepted when they are an ASCII letter (either
 * case), a decimal digit, '$' or '_'. Larger values are accepted when either
 * lit_char_is_unicode_letter or lit_char_is_unicode_non_letter_ident_part
 * accepts them.
 *
 * @return non-zero if the character is a valid identifier part.
 */
int
util_is_identifier_part_character (uint16_t chr) /**< EcmaScript character */
{
  if (chr > 127)
  {
    return (lit_char_is_unicode_letter (chr)
            || lit_char_is_unicode_non_letter_ident_part (chr));
  }

  /* Setting bit 0x20 maps ASCII uppercase letters onto their lowercase form. */
  const uint16_t folded_chr = (uint16_t) (chr | 0x20);
  const int is_ascii_letter = (folded_chr >= LIT_CHAR_LOWERCASE_A && folded_chr <= LIT_CHAR_LOWERCASE_Z);
  const int is_ascii_digit = (chr >= LIT_CHAR_0 && chr <= LIT_CHAR_9);

  return (is_ascii_letter
          || is_ascii_digit
          || chr == LIT_CHAR_DOLLAR_SIGN
          || chr == LIT_CHAR_UNDERSCORE);
} /* util_is_identifier_part_character */
/**
 * Encode a character as UTF8 bytes into the destination buffer.
 *
 * One, two or three bytes are written starting at dst_p, so the buffer
 * must have room for up to three bytes.
 *
 * @return number of bytes written (1, 2 or 3).
 */
size_t
util_to_utf8_bytes (uint8_t *dst_p, /**< destination buffer */
                    uint16_t chr) /**< EcmaScript character */
{
  if (chr <= 0x007f)
  {
    /* 00000000 0xxxxxxx -> 0xxxxxxx */
    dst_p[0] = (uint8_t) chr;
    return 1;
  }

  if (chr <= 0x07ff)
  {
    /* 00000yyy yyxxxxxx -> 110yyyyy 10xxxxxx */
    dst_p[0] = (uint8_t) (0xc0 | ((chr >> 6) & 0x1f));
    dst_p[1] = (uint8_t) (0x80 | (chr & 0x3f));
    return 2;
  }

  /* zzzzyyyy yyxxxxxx -> 1110zzzz 10yyyyyy 10xxxxxx */
  dst_p[0] = (uint8_t) (0xe0 | ((chr >> 12) & 0x0f));
  dst_p[1] = (uint8_t) (0x80 | ((chr >> 6) & 0x3f));
  dst_p[2] = (uint8_t) (0x80 | (chr & 0x3f));
  return 3;
} /* util_to_utf8_bytes */
/**
 * Compute how many bytes the UTF8 representation of a character occupies.
 *
 * @return length of the UTF8 representation (1, 2 or 3).
 */
size_t
util_get_utf8_length (uint16_t chr) /**< EcmaScript character */
{
  /* 00000000 0xxxxxxx needs a single byte. */
  size_t length = 1;

  if (chr > 0x007f)
  {
    /* 00000yyy yyxxxxxx needs a second byte. */
    length++;
  }

  if (chr > 0x07ff)
  {
    /* zzzzyyyy yyxxxxxx needs a third byte. */
    length++;
  }

  return length;
} /* util_get_utf8_length */
/** /**
* Free literal. * Free literal.
*/ */
-10
View File
@@ -47,16 +47,6 @@
#include "lit-literal.h" #include "lit-literal.h"
#include "mem-heap.h" #include "mem-heap.h"
/* UTF character management. Only ASCII characters are
* supported for simplicity. */
int util_is_identifier_start (const uint8_t *);
int util_is_identifier_part (const uint8_t *);
int util_is_identifier_start_character (uint16_t);
int util_is_identifier_part_character (uint16_t);
size_t util_to_utf8_bytes (uint8_t *, uint16_t);
size_t util_get_utf8_length (uint16_t);
/* Immediate management. */ /* Immediate management. */
/** /**
+184 -214
View File
@@ -31,7 +31,7 @@
* @{ * @{
*/ */
#define IS_UTF8_INTERMEDIATE_OCTET(byte) (((byte) & 0xc0) == 0x80) #define IS_UTF8_INTERMEDIATE_OCTET(byte) (((byte) & LIT_UTF8_EXTRA_BYTE_MASK) == LIT_UTF8_2_BYTE_CODE_POINT_MIN)
/** /**
* Align column to the next tab position. * Align column to the next tab position.
@@ -42,7 +42,7 @@ static parser_line_counter_t
align_column_to_tab (parser_line_counter_t column) /**< current column */ align_column_to_tab (parser_line_counter_t column) /**< current column */
{ {
/* Tab aligns to zero column start position. */ /* Tab aligns to zero column start position. */
return (parser_line_counter_t) (((column + (8u - 1u)) & ~0x7u) + 1u); return (parser_line_counter_t) (((column + (8u - 1u)) & ~ECMA_STRING_CONTAINER_MASK) + 1u);
} /* align_column_to_tab */ } /* align_column_to_tab */
/** /**
@@ -50,7 +50,7 @@ align_column_to_tab (parser_line_counter_t column) /**< current column */
* *
* @return character value * @return character value
*/ */
static ecma_char_t ecma_char_t
lexer_hex_to_character (parser_context_t *context_p, /**< context */ lexer_hex_to_character (parser_context_t *context_p, /**< context */
const uint8_t *source_p, /**< current source position */ const uint8_t *source_p, /**< current source position */
int length) /**< source length */ int length) /**< source length */
@@ -63,16 +63,16 @@ lexer_hex_to_character (parser_context_t *context_p, /**< context */
result <<= 4; result <<= 4;
if (byte >= '0' && byte <= '9') if (byte >= LIT_CHAR_0 && byte <= LIT_CHAR_9)
{ {
result += byte - '0'; result += byte - LIT_CHAR_0;
} }
else else
{ {
byte |= 0x20; byte = LEXER_TO_ASCII_LOWERCASE (byte);
if (byte >= 'a' && byte <= 'f') if (byte >= LIT_CHAR_LOWERCASE_A && byte <= LIT_CHAR_LOWERCASE_F)
{ {
result += byte - ('a' - 10); result += byte - (LIT_CHAR_LOWERCASE_A - 10);
} }
else else
{ {
@@ -142,9 +142,9 @@ skip_spaces (parser_context_t *context_p) /**< context */
/* FALLTHRU */ /* FALLTHRU */
} }
case 0x0b: case LIT_CHAR_VTAB:
case 0x0c: case LIT_CHAR_FF:
case 0x20: case LIT_CHAR_SP:
{ {
context_p->source_p++; context_p->source_p++;
context_p->column++; context_p->column++;
@@ -158,16 +158,16 @@ skip_spaces (parser_context_t *context_p) /**< context */
continue; continue;
} }
case '/': case LIT_CHAR_SLASH:
{ {
if (mode == LEXER_SKIP_SPACES if (mode == LEXER_SKIP_SPACES
&& context_p->source_p + 1 < source_end_p) && context_p->source_p + 1 < source_end_p)
{ {
if (context_p->source_p[1] == '/') if (context_p->source_p[1] == LIT_CHAR_SLASH)
{ {
mode = LEXER_SKIP_SINGLE_LINE_COMMENT; mode = LEXER_SKIP_SINGLE_LINE_COMMENT;
} }
else if (context_p->source_p[1] == '*') else if (context_p->source_p[1] == LIT_CHAR_ASTERISK)
{ {
mode = LEXER_SKIP_MULTI_LINE_COMMENT; mode = LEXER_SKIP_MULTI_LINE_COMMENT;
context_p->token.line = context_p->line; context_p->token.line = context_p->line;
@@ -184,11 +184,11 @@ skip_spaces (parser_context_t *context_p) /**< context */
break; break;
} }
case '*': case LIT_CHAR_ASTERISK:
{ {
if (mode == LEXER_SKIP_MULTI_LINE_COMMENT if (mode == LEXER_SKIP_MULTI_LINE_COMMENT
&& context_p->source_p + 1 < source_end_p && context_p->source_p + 1 < source_end_p
&& context_p->source_p[1] == '/') && context_p->source_p[1] == LIT_CHAR_SLASH)
{ {
mode = LEXER_SKIP_SPACES; mode = LEXER_SKIP_SPACES;
context_p->source_p += 2; context_p->source_p += 2;
@@ -436,7 +436,7 @@ lexer_parse_identifier (parser_context_t *context_p, /**< context */
do do
{ {
if (*source_p == '\\') if (*source_p == LIT_CHAR_BACKSLASH)
{ {
uint16_t character; uint16_t character;
@@ -444,7 +444,7 @@ lexer_parse_identifier (parser_context_t *context_p, /**< context */
context_p->source_p = source_p; context_p->source_p = source_p;
context_p->token.column = column; context_p->token.column = column;
if ((source_p + 6 > source_end_p) || (source_p[1] != 'u')) if ((source_p + 6 > source_end_p) || (source_p[1] != LIT_CHAR_LOWERCASE_U))
{ {
parser_raise_error (context_p, PARSER_ERR_INVALID_UNICODE_ESCAPE_SEQUENCE); parser_raise_error (context_p, PARSER_ERR_INVALID_UNICODE_ESCAPE_SEQUENCE);
} }
@@ -453,20 +453,20 @@ lexer_parse_identifier (parser_context_t *context_p, /**< context */
if (length == 0) if (length == 0)
{ {
if (!util_is_identifier_start_character (character)) if (!lit_char_is_identifier_start_character (character))
{ {
parser_raise_error (context_p, PARSER_ERR_INVALID_IDENTIFIER_START); parser_raise_error (context_p, PARSER_ERR_INVALID_IDENTIFIER_START);
} }
} }
else else
{ {
if (!util_is_identifier_part_character (character)) if (!lit_char_is_identifier_part_character (character))
{ {
parser_raise_error (context_p, PARSER_ERR_INVALID_IDENTIFIER_PART); parser_raise_error (context_p, PARSER_ERR_INVALID_IDENTIFIER_PART);
} }
} }
length += util_get_utf8_length (character); length += lit_char_get_utf8_length (character);
source_p += 6; source_p += 6;
PARSER_PLUS_EQUAL_LC (column, 6); PARSER_PLUS_EQUAL_LC (column, 6);
continue; continue;
@@ -490,7 +490,7 @@ lexer_parse_identifier (parser_context_t *context_p, /**< context */
} }
} }
while (source_p < source_end_p while (source_p < source_end_p
&& (util_is_identifier_part (source_p) || *source_p == '\\')); && (lit_char_is_identifier_part (source_p) || *source_p == LIT_CHAR_BACKSLASH));
context_p->source_p = ident_start_p; context_p->source_p = ident_start_p;
context_p->token.column = context_p->column; context_p->token.column = context_p->column;
@@ -574,7 +574,7 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
break; break;
} }
if (*source_p == '\\') if (*source_p == LIT_CHAR_BACKSLASH)
{ {
source_p++; source_p++;
column++; column++;
@@ -616,7 +616,7 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
/* Except \x, \u, and octal numbers, everything is /* Except \x, \u, and octal numbers, everything is
* converted to a character which has the same byte length. */ * converted to a character which has the same byte length. */
if (*source_p >= '0' && *source_p <= '3') if (*source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_3)
{ {
if (context_p->status_flags & PARSER_IS_STRICT) if (context_p->status_flags & PARSER_IS_STRICT)
{ {
@@ -626,16 +626,16 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
source_p++; source_p++;
column++; column++;
if (source_p < source_end_p && *source_p >= '0' && *source_p <= '7') if (source_p < source_end_p && *source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_7)
{ {
source_p++; source_p++;
column++; column++;
if (source_p < source_end_p && *source_p >= '0' && *source_p <= '7') if (source_p < source_end_p && *source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_7)
{ {
/* Numbers >= 0x200 (0x80) requires /* Numbers >= 0x200 (0x80) requires
* two bytes for encoding in UTF-8. */ * two bytes for encoding in UTF-8. */
if (source_p[-2] >= '2') if (source_p[-2] >= LIT_CHAR_2)
{ {
length++; length++;
} }
@@ -649,7 +649,7 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
continue; continue;
} }
if (*source_p >= '4' && *source_p <= '7') if (*source_p >= LIT_CHAR_4 && *source_p <= LIT_CHAR_7)
{ {
if (context_p->status_flags & PARSER_IS_STRICT) if (context_p->status_flags & PARSER_IS_STRICT)
{ {
@@ -659,7 +659,7 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
source_p++; source_p++;
column++; column++;
if (source_p < source_end_p && *source_p >= '0' && *source_p <= '7') if (source_p < source_end_p && *source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_7)
{ {
source_p++; source_p++;
column++; column++;
@@ -671,9 +671,9 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
continue; continue;
} }
if (*source_p == 'x' || *source_p == 'u') if (*source_p == LIT_CHAR_LOWERCASE_X || *source_p == LIT_CHAR_LOWERCASE_U)
{ {
uint8_t hex_part_length = (*source_p == 'x') ? 2 : 4; uint8_t hex_part_length = (*source_p == LIT_CHAR_LOWERCASE_X) ? 2 : 4;
context_p->token.line = line; context_p->token.line = line;
context_p->token.column = (parser_line_counter_t) (column - 1); context_p->token.column = (parser_line_counter_t) (column - 1);
@@ -682,9 +682,9 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
parser_raise_error (context_p, PARSER_ERR_INVALID_ESCAPE_SEQUENCE); parser_raise_error (context_p, PARSER_ERR_INVALID_ESCAPE_SEQUENCE);
} }
length += util_get_utf8_length (lexer_hex_to_character (context_p, length += lit_char_get_utf8_length (lexer_hex_to_character (context_p,
source_p + 1, source_p + 1,
hex_part_length)); hex_part_length));
source_p += hex_part_length + 1; source_p += hex_part_length + 1;
PARSER_PLUS_EQUAL_LC (column, hex_part_length + 1u); PARSER_PLUS_EQUAL_LC (column, hex_part_length + 1u);
continue; continue;
@@ -747,17 +747,6 @@ lexer_parse_string (parser_context_t *context_p) /**< context */
context_p->column = (parser_line_counter_t) (column + 1); context_p->column = (parser_line_counter_t) (column + 1);
} /* lexer_parse_string */ } /* lexer_parse_string */
/**
 * Check whether a character is a hexadecimal digit ('0'-'9', 'a'-'f' or 'A'-'F').
 *
 * @return non-zero if the character is a hex digit.
 */
static int
lexer_is_hex_digit (uint8_t character) /**< input character */
{
  if (character >= '0' && character <= '9')
  {
    return 1;
  }

  /* Setting bit 0x20 maps 'A'-'F' onto 'a'-'f', so one range check covers both cases. */
  const int folded_character = character | 0x20;

  return (folded_character >= 'a' && folded_character <= 'f');
} /* lexer_is_hex_digit */
/** /**
* Parse number. * Parse number.
*/ */
@@ -776,16 +765,16 @@ lexer_parse_number (parser_context_t *context_p) /**< context */
context_p->token.lit_location.type = LEXER_NUMBER_LITERAL; context_p->token.lit_location.type = LEXER_NUMBER_LITERAL;
context_p->token.lit_location.has_escape = PARSER_FALSE; context_p->token.lit_location.has_escape = PARSER_FALSE;
if (source_p[0] == '0' if (source_p[0] == LIT_CHAR_0
&& source_p + 1 < source_end_p) && source_p + 1 < source_end_p)
{ {
if ((source_p[1] | 0x20) == 'x') if (LEXER_TO_ASCII_LOWERCASE (source_p[1]) == LIT_CHAR_LOWERCASE_X)
{ {
context_p->token.extra_value = LEXER_NUMBER_HEXADECIMAL; context_p->token.extra_value = LEXER_NUMBER_HEXADECIMAL;
source_p += 2; source_p += 2;
if (source_p >= source_end_p if (source_p >= source_end_p
|| !lexer_is_hex_digit (source_p[0])) || !lit_char_is_hex_digit (source_p[0]))
{ {
parser_raise_error (context_p, PARSER_ERR_INVALID_HEX_DIGIT); parser_raise_error (context_p, PARSER_ERR_INVALID_HEX_DIGIT);
} }
@@ -795,10 +784,10 @@ lexer_parse_number (parser_context_t *context_p) /**< context */
source_p++; source_p++;
} }
while (source_p < source_end_p while (source_p < source_end_p
&& lexer_is_hex_digit (source_p[0])); && lit_char_is_hex_digit (source_p[0]));
} }
else if (source_p[1] >= '0' else if (source_p[1] >= LIT_CHAR_0
&& source_p[1] <= '7') && source_p[1] <= LIT_CHAR_7)
{ {
context_p->token.extra_value = LEXER_NUMBER_OCTAL; context_p->token.extra_value = LEXER_NUMBER_OCTAL;
@@ -812,18 +801,18 @@ lexer_parse_number (parser_context_t *context_p) /**< context */
source_p++; source_p++;
} }
while (source_p < source_end_p while (source_p < source_end_p
&& source_p[0] >= '0' && source_p[0] >= LIT_CHAR_0
&& source_p[0] <= '7'); && source_p[0] <= LIT_CHAR_7);
if (source_p < source_end_p if (source_p < source_end_p
&& source_p[0] >= '8' && source_p[0] >= LIT_CHAR_8
&& source_p[0] <= '9') && source_p[0] <= LIT_CHAR_9)
{ {
parser_raise_error (context_p, PARSER_ERR_INVALID_NUMBER); parser_raise_error (context_p, PARSER_ERR_INVALID_NUMBER);
} }
} }
else if (source_p[1] >= '8' else if (source_p[1] >= LIT_CHAR_8
&& source_p[1] <= '9') && source_p[1] <= LIT_CHAR_9)
{ {
parser_raise_error (context_p, PARSER_ERR_INVALID_NUMBER); parser_raise_error (context_p, PARSER_ERR_INVALID_NUMBER);
} }
@@ -840,8 +829,8 @@ lexer_parse_number (parser_context_t *context_p) /**< context */
source_p++; source_p++;
} }
while (source_p < source_end_p while (source_p < source_end_p
&& source_p[0] >= '0' && source_p[0] >= LIT_CHAR_0
&& source_p[0] <= '9'); && source_p[0] <= LIT_CHAR_9);
can_be_float = PARSER_TRUE; can_be_float = PARSER_TRUE;
} }
@@ -849,31 +838,31 @@ lexer_parse_number (parser_context_t *context_p) /**< context */
if (can_be_float) if (can_be_float)
{ {
if (source_p < source_end_p if (source_p < source_end_p
&& source_p[0] == '.') && source_p[0] == LIT_CHAR_DOT)
{ {
source_p++; source_p++;
while (source_p < source_end_p while (source_p < source_end_p
&& source_p[0] >= '0' && source_p[0] >= LIT_CHAR_0
&& source_p[0] <= '9') && source_p[0] <= LIT_CHAR_9)
{ {
source_p++; source_p++;
} }
} }
if (source_p < source_end_p if (source_p < source_end_p
&& (source_p[0] | 0x20) == 'e') && LEXER_TO_ASCII_LOWERCASE (source_p[0]) == LIT_CHAR_LOWERCASE_E)
{ {
source_p++; source_p++;
if (source_p < source_end_p if (source_p < source_end_p
&& (source_p[0] == '+' || source_p[0] == '-')) && (source_p[0] == LIT_CHAR_PLUS || source_p[0] == LIT_CHAR_MINUS))
{ {
source_p++; source_p++;
} }
if (source_p >= source_end_p if (source_p >= source_end_p
|| source_p[0] < '0' || source_p[0] < LIT_CHAR_0
|| source_p[0] > '9') || source_p[0] > LIT_CHAR_9)
{ {
parser_raise_error (context_p, PARSER_ERR_MISSING_EXPONENT); parser_raise_error (context_p, PARSER_ERR_MISSING_EXPONENT);
} }
@@ -883,13 +872,13 @@ lexer_parse_number (parser_context_t *context_p) /**< context */
source_p++; source_p++;
} }
while (source_p < source_end_p while (source_p < source_end_p
&& source_p[0] >= '0' && source_p[0] >= LIT_CHAR_0
&& source_p[0] <= '9'); && source_p[0] <= LIT_CHAR_9);
} }
} }
if (source_p < source_end_p if (source_p < source_end_p
&& (util_is_identifier_start (source_p) || source_p[0] == '\\')) && (lit_char_is_identifier_start (source_p) || source_p[0] == LIT_CHAR_BACKSLASH))
{ {
parser_raise_error (context_p, PARSER_ERR_IDENTIFIER_AFTER_NUMBER); parser_raise_error (context_p, PARSER_ERR_IDENTIFIER_AFTER_NUMBER);
} }
@@ -995,14 +984,14 @@ lexer_next_token (parser_context_t *context_p) /**< context */
return; return;
} }
if (util_is_identifier_start (context_p->source_p) if (lit_char_is_identifier_start (context_p->source_p)
|| context_p->source_p[0] == '\\') || context_p->source_p[0] == LIT_CHAR_BACKSLASH)
{ {
lexer_parse_identifier (context_p, PARSER_TRUE); lexer_parse_identifier (context_p, PARSER_TRUE);
return; return;
} }
if (context_p->source_p[0] >= '0' && context_p->source_p[0] <= '9') if (context_p->source_p[0] >= LIT_CHAR_0 && context_p->source_p[0] <= LIT_CHAR_9)
{ {
lexer_parse_number (context_p); lexer_parse_number (context_p);
return; return;
@@ -1010,19 +999,19 @@ lexer_next_token (parser_context_t *context_p) /**< context */
switch (context_p->source_p[0]) switch (context_p->source_p[0])
{ {
LEXER_TYPE_A_TOKEN ('{', LEXER_LEFT_BRACE); LEXER_TYPE_A_TOKEN (LIT_CHAR_LEFT_BRACE, LEXER_LEFT_BRACE);
LEXER_TYPE_A_TOKEN ('(', LEXER_LEFT_PAREN); LEXER_TYPE_A_TOKEN (LIT_CHAR_LEFT_PAREN, LEXER_LEFT_PAREN);
LEXER_TYPE_A_TOKEN ('[', LEXER_LEFT_SQUARE); LEXER_TYPE_A_TOKEN (LIT_CHAR_LEFT_SQUARE, LEXER_LEFT_SQUARE);
LEXER_TYPE_A_TOKEN ('}', LEXER_RIGHT_BRACE); LEXER_TYPE_A_TOKEN (LIT_CHAR_RIGHT_BRACE, LEXER_RIGHT_BRACE);
LEXER_TYPE_A_TOKEN (')', LEXER_RIGHT_PAREN); LEXER_TYPE_A_TOKEN (LIT_CHAR_RIGHT_PAREN, LEXER_RIGHT_PAREN);
LEXER_TYPE_A_TOKEN (']', LEXER_RIGHT_SQUARE); LEXER_TYPE_A_TOKEN (LIT_CHAR_RIGHT_SQUARE, LEXER_RIGHT_SQUARE);
LEXER_TYPE_A_TOKEN (';', LEXER_SEMICOLON); LEXER_TYPE_A_TOKEN (LIT_CHAR_SEMICOLON, LEXER_SEMICOLON);
LEXER_TYPE_A_TOKEN (',', LEXER_COMMA); LEXER_TYPE_A_TOKEN (LIT_CHAR_COMMA, LEXER_COMMA);
case (uint8_t) '.' : case (uint8_t) LIT_CHAR_DOT :
{ {
if (length >= 2 if (length >= 2
&& (context_p->source_p[1] >= '0' && context_p->source_p[1] <= '9')) && (context_p->source_p[1] >= LIT_CHAR_0 && context_p->source_p[1] <= LIT_CHAR_9))
{ {
lexer_parse_number (context_p); lexer_parse_number (context_p);
return; return;
@@ -1033,20 +1022,20 @@ lexer_next_token (parser_context_t *context_p) /**< context */
break; break;
} }
case (uint8_t) '<': case (uint8_t) LIT_CHAR_LESS_THAN:
{ {
if (length >= 2) if (length >= 2)
{ {
if (context_p->source_p[1] == (uint8_t) '=') if (context_p->source_p[1] == (uint8_t) LIT_CHAR_EQUALS)
{ {
context_p->token.type = LEXER_LESS_EQUAL; context_p->token.type = LEXER_LESS_EQUAL;
length = 2; length = 2;
break; break;
} }
if (context_p->source_p[1] == (uint8_t) '<') if (context_p->source_p[1] == (uint8_t) LIT_CHAR_LESS_THAN)
{ {
if (length >= 3 && context_p->source_p[2] == (uint8_t) '=') if (length >= 3 && context_p->source_p[2] == (uint8_t) LIT_CHAR_EQUALS)
{ {
context_p->token.type = LEXER_ASSIGN_LEFT_SHIFT; context_p->token.type = LEXER_ASSIGN_LEFT_SHIFT;
length = 3; length = 3;
@@ -1064,31 +1053,31 @@ lexer_next_token (parser_context_t *context_p) /**< context */
break; break;
} }
case '>': case LIT_CHAR_GREATER_THAN:
{ {
if (length >= 2) if (length >= 2)
{ {
if (context_p->source_p[1] == (uint8_t) '=') if (context_p->source_p[1] == (uint8_t) LIT_CHAR_EQUALS)
{ {
context_p->token.type = LEXER_GREATER_EQUAL; context_p->token.type = LEXER_GREATER_EQUAL;
length = 2; length = 2;
break; break;
} }
if (context_p->source_p[1] == (uint8_t) '>') if (context_p->source_p[1] == (uint8_t) LIT_CHAR_GREATER_THAN)
{ {
if (length >= 3) if (length >= 3)
{ {
if (context_p->source_p[2] == (uint8_t) '=') if (context_p->source_p[2] == (uint8_t) LIT_CHAR_EQUALS)
{ {
context_p->token.type = LEXER_ASSIGN_RIGHT_SHIFT; context_p->token.type = LEXER_ASSIGN_RIGHT_SHIFT;
length = 3; length = 3;
break; break;
} }
if (context_p->source_p[2] == (uint8_t) '>') if (context_p->source_p[2] == (uint8_t) LIT_CHAR_GREATER_THAN)
{ {
if (length >= 4 && context_p->source_p[3] == (uint8_t) '=') if (length >= 4 && context_p->source_p[3] == (uint8_t) LIT_CHAR_EQUALS)
{ {
context_p->token.type = LEXER_ASSIGN_UNS_RIGHT_SHIFT; context_p->token.type = LEXER_ASSIGN_UNS_RIGHT_SHIFT;
length = 4; length = 4;
@@ -1112,27 +1101,37 @@ lexer_next_token (parser_context_t *context_p) /**< context */
break; break;
} }
LEXER_TYPE_D_TOKEN ('=', LEXER_ASSIGN, '=', LEXER_EQUAL, '=', LEXER_STRICT_EQUAL) LEXER_TYPE_D_TOKEN (LIT_CHAR_EQUALS, LEXER_ASSIGN, LIT_CHAR_EQUALS,
LEXER_TYPE_D_TOKEN ('!', LEXER_LOGICAL_NOT, '=', LEXER_NOT_EQUAL, '=', LEXER_STRICT_NOT_EQUAL) LEXER_EQUAL, LIT_CHAR_EQUALS, LEXER_STRICT_EQUAL)
LEXER_TYPE_D_TOKEN (LIT_CHAR_EXCLAMATION, LEXER_LOGICAL_NOT, LIT_CHAR_EQUALS,
LEXER_NOT_EQUAL, LIT_CHAR_EQUALS, LEXER_STRICT_NOT_EQUAL)
LEXER_TYPE_C_TOKEN ('+', LEXER_ADD, '=', LEXER_ASSIGN_ADD, '+', LEXER_INCREASE) LEXER_TYPE_C_TOKEN (LIT_CHAR_PLUS, LEXER_ADD, LIT_CHAR_EQUALS,
LEXER_TYPE_C_TOKEN ('-', LEXER_SUBTRACT, '=', LEXER_ASSIGN_SUBTRACT, '-', LEXER_DECREASE) LEXER_ASSIGN_ADD, LIT_CHAR_PLUS, LEXER_INCREASE)
LEXER_TYPE_C_TOKEN (LIT_CHAR_MINUS, LEXER_SUBTRACT, LIT_CHAR_EQUALS,
LEXER_ASSIGN_SUBTRACT, LIT_CHAR_MINUS, LEXER_DECREASE)
LEXER_TYPE_B_TOKEN ('*', LEXER_MULTIPLY, '=', LEXER_ASSIGN_MULTIPLY) LEXER_TYPE_B_TOKEN (LIT_CHAR_ASTERISK, LEXER_MULTIPLY, LIT_CHAR_EQUALS,
LEXER_TYPE_B_TOKEN ('/', LEXER_DIVIDE, '=', LEXER_ASSIGN_DIVIDE) LEXER_ASSIGN_MULTIPLY)
LEXER_TYPE_B_TOKEN ('%', LEXER_MODULO, '=', LEXER_ASSIGN_MODULO) LEXER_TYPE_B_TOKEN (LIT_CHAR_SLASH, LEXER_DIVIDE, LIT_CHAR_EQUALS,
LEXER_ASSIGN_DIVIDE)
LEXER_TYPE_B_TOKEN (LIT_CHAR_PERCENT, LEXER_MODULO, LIT_CHAR_EQUALS,
LEXER_ASSIGN_MODULO)
LEXER_TYPE_C_TOKEN ('&', LEXER_BIT_AND, '=', LEXER_ASSIGN_BIT_AND, '&', LEXER_LOGICAL_AND) LEXER_TYPE_C_TOKEN (LIT_CHAR_AMPERSAND, LEXER_BIT_AND, LIT_CHAR_EQUALS,
LEXER_TYPE_C_TOKEN ('|', LEXER_BIT_OR, '=', LEXER_ASSIGN_BIT_OR, '|', LEXER_LOGICAL_OR) LEXER_ASSIGN_BIT_AND, LIT_CHAR_AMPERSAND, LEXER_LOGICAL_AND)
LEXER_TYPE_C_TOKEN (LIT_CHAR_VLINE, LEXER_BIT_OR, LIT_CHAR_EQUALS,
LEXER_ASSIGN_BIT_OR, LIT_CHAR_VLINE, LEXER_LOGICAL_OR)
LEXER_TYPE_B_TOKEN ('^', LEXER_BIT_XOR, '=', LEXER_ASSIGN_BIT_XOR) LEXER_TYPE_B_TOKEN (LIT_CHAR_CIRCUMFLEX, LEXER_BIT_XOR, LIT_CHAR_EQUALS,
LEXER_ASSIGN_BIT_XOR)
LEXER_TYPE_A_TOKEN ('~', LEXER_BIT_NOT); LEXER_TYPE_A_TOKEN (LIT_CHAR_TILDE, LEXER_BIT_NOT);
LEXER_TYPE_A_TOKEN ('?', LEXER_QUESTION_MARK); LEXER_TYPE_A_TOKEN (LIT_CHAR_QUESTION, LEXER_QUESTION_MARK);
LEXER_TYPE_A_TOKEN (':', LEXER_COLON); LEXER_TYPE_A_TOKEN (LIT_CHAR_COLON, LEXER_COLON);
case '\'': case LIT_CHAR_SINGLE_QUOTE:
case '"': case LIT_CHAR_DOUBLE_QUOTE:
{ {
lexer_parse_string (context_p); lexer_parse_string (context_p);
return; return;
@@ -1258,10 +1257,10 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
do do
{ {
if (*source_p == '\\') if (*source_p == LIT_CHAR_BACKSLASH)
{ {
destination_p += util_to_utf8_bytes (destination_p, destination_p += lit_char_to_utf8_bytes (destination_p,
lexer_hex_to_character (context_p, source_p + 2, 4)); lexer_hex_to_character (context_p, source_p + 2, 4));
source_p += 6; source_p += 6;
continue; continue;
} }
@@ -1275,7 +1274,7 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
} }
} }
while (source_p < source_end_p while (source_p < source_end_p
&& (util_is_identifier_part (source_p) || *source_p == '\\')); && (lit_char_is_identifier_part (source_p) || *source_p == LIT_CHAR_BACKSLASH));
JERRY_ASSERT (destination_p == destination_start_p + literal_p->length); JERRY_ASSERT (destination_p == destination_start_p + literal_p->length);
} }
@@ -1290,7 +1289,7 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
break; break;
} }
if (*source_p == '\\') if (*source_p == LIT_CHAR_BACKSLASH)
{ {
uint8_t conv_character; uint8_t conv_character;
@@ -1323,41 +1322,41 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
continue; continue;
} }
if (*source_p >= '0' && *source_p <= '3') if (*source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_3)
{ {
uint32_t octal_number = (uint32_t) (*source_p - '0'); uint32_t octal_number = (uint32_t) (*source_p - LIT_CHAR_0);
source_p++; source_p++;
JERRY_ASSERT (source_p < context_p->source_end_p); JERRY_ASSERT (source_p < context_p->source_end_p);
if (*source_p >= '0' && *source_p <= '7') if (*source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_7)
{ {
octal_number = octal_number * 8 + (uint32_t) (*source_p - '0'); octal_number = octal_number * 8 + (uint32_t) (*source_p - LIT_CHAR_0);
source_p++; source_p++;
JERRY_ASSERT (source_p < context_p->source_end_p); JERRY_ASSERT (source_p < context_p->source_end_p);
if (*source_p >= '0' && *source_p <= '7') if (*source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_7)
{ {
octal_number = octal_number * 8 + (uint32_t) (*source_p - '0'); octal_number = octal_number * 8 + (uint32_t) (*source_p - LIT_CHAR_0);
source_p++; source_p++;
JERRY_ASSERT (source_p < context_p->source_end_p); JERRY_ASSERT (source_p < context_p->source_end_p);
} }
} }
destination_p += util_to_utf8_bytes (destination_p, (uint16_t) octal_number); destination_p += lit_char_to_utf8_bytes (destination_p, (uint16_t) octal_number);
continue; continue;
} }
if (*source_p >= '4' && *source_p <= '7') if (*source_p >= LIT_CHAR_4 && *source_p <= LIT_CHAR_7)
{ {
uint32_t octal_number = (uint32_t) (*source_p - '0'); uint32_t octal_number = (uint32_t) (*source_p - LIT_CHAR_0);
source_p++; source_p++;
JERRY_ASSERT (source_p < context_p->source_end_p); JERRY_ASSERT (source_p < context_p->source_end_p);
if (*source_p >= '0' && *source_p <= '7') if (*source_p >= LIT_CHAR_0 && *source_p <= LIT_CHAR_7)
{ {
octal_number = octal_number * 8 + (uint32_t) (*source_p - '0'); octal_number = octal_number * 8 + (uint32_t) (*source_p - LIT_CHAR_0);
source_p++; source_p++;
JERRY_ASSERT (source_p < context_p->source_end_p); JERRY_ASSERT (source_p < context_p->source_end_p);
} }
@@ -1366,15 +1365,15 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
continue; continue;
} }
if (*source_p == 'x' || *source_p == 'u') if (*source_p == LIT_CHAR_LOWERCASE_X || *source_p == LIT_CHAR_LOWERCASE_U)
{ {
int hex_part_length = (*source_p == 'x') ? 2 : 4; int hex_part_length = (*source_p == LIT_CHAR_LOWERCASE_X) ? 2 : 4;
JERRY_ASSERT (source_p + 1 + hex_part_length <= context_p->source_end_p); JERRY_ASSERT (source_p + 1 + hex_part_length <= context_p->source_end_p);
destination_p += util_to_utf8_bytes (destination_p, destination_p += lit_char_to_utf8_bytes (destination_p,
lexer_hex_to_character (context_p, lexer_hex_to_character (context_p,
source_p + 1, source_p + 1,
hex_part_length)); hex_part_length));
source_p += hex_part_length + 1; source_p += hex_part_length + 1;
continue; continue;
} }
@@ -1382,32 +1381,32 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
conv_character = *source_p; conv_character = *source_p;
switch (*source_p) switch (*source_p)
{ {
case 'b': case LIT_CHAR_LOWERCASE_B:
{ {
conv_character = 0x08; conv_character = 0x08;
break; break;
} }
case 't': case LIT_CHAR_LOWERCASE_T:
{ {
conv_character = 0x09; conv_character = 0x09;
break; break;
} }
case 'n': case LIT_CHAR_LOWERCASE_N:
{ {
conv_character = 0x0a; conv_character = 0x0a;
break; break;
} }
case 'v': case LIT_CHAR_LOWERCASE_V:
{ {
conv_character = 0x0b; conv_character = 0x0b;
break; break;
} }
case 'f': case LIT_CHAR_LOWERCASE_F:
{ {
conv_character = 0x0c; conv_character = 0x0c;
break; break;
} }
case 'r': case LIT_CHAR_LOWERCASE_R:
{ {
conv_character = 0x0d; conv_character = 0x0d;
break; break;
@@ -1429,16 +1428,16 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
* long sequence. */ * long sequence. */
uint32_t character = ((((uint32_t) source_p[0]) & 0x7) << 18); uint32_t character = ((((uint32_t) source_p[0]) & 0x7) << 18);
character |= ((((uint32_t) source_p[1]) & 0x3f) << 12); character |= ((((uint32_t) source_p[1]) & LIT_UTF8_LAST_6_BITS_MASK) << 12);
character |= ((((uint32_t) source_p[2]) & 0x3f) << 6); character |= ((((uint32_t) source_p[2]) & LIT_UTF8_LAST_6_BITS_MASK) << 6);
character |= (((uint32_t) source_p[3]) & 0x3f); character |= (((uint32_t) source_p[3]) & LIT_UTF8_LAST_6_BITS_MASK);
JERRY_ASSERT (character >= 0x10000); JERRY_ASSERT (character >= 0x10000);
character -= 0x10000; character -= 0x10000;
destination_p += util_to_utf8_bytes (destination_p, destination_p += lit_char_to_utf8_bytes (destination_p,
(ecma_char_t) (0xd800 | (character >> 10))); (ecma_char_t) (0xd800 | (character >> 10)));
destination_p += util_to_utf8_bytes (destination_p, destination_p += lit_char_to_utf8_bytes (destination_p,
(ecma_char_t) (0xdc00 | (character & 0x3ff))); (ecma_char_t) (0xdc00 | (character & LIT_UTF16_LAST_10_BITS_MASK)));
source_p += 4; source_p += 4;
continue; continue;
} }
@@ -1476,17 +1475,17 @@ lexer_construct_literal_object (parser_context_t *context_p, /**< context */
} }
if (literal_p->length == 4 if (literal_p->length == 4
&& source_p[0] == 'e' && source_p[0] == LIT_CHAR_LOWERCASE_E
&& source_p[3] == 'l' && source_p[3] == LIT_CHAR_LOWERCASE_L
&& source_p[1] == 'v' && source_p[1] == LIT_CHAR_LOWERCASE_V
&& source_p[2] == 'a') && source_p[2] == LIT_CHAR_LOWERCASE_A)
{ {
context_p->lit_object.type = LEXER_LITERAL_OBJECT_EVAL; context_p->lit_object.type = LEXER_LITERAL_OBJECT_EVAL;
} }
if (literal_p->length == 9 if (literal_p->length == 9
&& source_p[0] == 'a' && source_p[0] == LIT_CHAR_LOWERCASE_A
&& source_p[8] == 's' && source_p[8] == LIT_CHAR_LOWERCASE_S
&& memcmp (source_p + 1, "rgument", 7) == 0) && memcmp (source_p + 1, "rgument", 7) == 0)
{ {
context_p->lit_object.type = LEXER_LITERAL_OBJECT_ARGUMENTS; context_p->lit_object.type = LEXER_LITERAL_OBJECT_ARGUMENTS;
@@ -1543,7 +1542,7 @@ lexer_construct_number_object (parser_context_t *context_p, /**< context */
do do
{ {
src_p++; src_p++;
num = num * 8 + (ecma_number_t) (*src_p - '0'); num = num * 8 + (ecma_number_t) (*src_p - LIT_CHAR_0);
} }
while (src_p < src_end_p); while (src_p < src_end_p);
} }
@@ -1677,7 +1676,7 @@ lexer_construct_regexp_object (parser_context_t *context_p, /**< context */
parser_raise_error (context_p, PARSER_ERR_UNTERMINATED_REGEXP); parser_raise_error (context_p, PARSER_ERR_UNTERMINATED_REGEXP);
} }
if (!in_class && source_p[0] == '/') if (!in_class && source_p[0] == LIT_CHAR_SLASH)
{ {
regex_end_p = source_p; regex_end_p = source_p;
source_p++; source_p++;
@@ -1705,24 +1704,24 @@ lexer_construct_regexp_object (parser_context_t *context_p, /**< context */
column--; column--;
break; break;
} }
case '[': case LIT_CHAR_LEFT_SQUARE:
{ {
in_class = PARSER_TRUE; in_class = PARSER_TRUE;
break; break;
} }
case ']': case LIT_CHAR_RIGHT_SQUARE:
{ {
in_class = PARSER_FALSE; in_class = PARSER_FALSE;
break; break;
} }
case '\\': case LIT_CHAR_BACKSLASH:
{ {
if (source_p + 1 >= source_end_p) if (source_p + 1 >= source_end_p)
{ {
parser_raise_error (context_p, PARSER_ERR_UNTERMINATED_REGEXP); parser_raise_error (context_p, PARSER_ERR_UNTERMINATED_REGEXP);
} }
if (source_p[1] >= 0x20 && source_p[1] <= 0x7f) if (source_p[1] >= 0x20 && source_p[1] <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
{ {
source_p++; source_p++;
column++; column++;
@@ -1740,21 +1739,20 @@ lexer_construct_regexp_object (parser_context_t *context_p, /**< context */
} }
} }
/* TODO: This is duplicate of 're_parse_regexp_flags'. Move this to a helper function. */
current_flags = 0; current_flags = 0;
while (source_p < source_end_p) while (source_p < source_end_p)
{ {
uint32_t flag = 0; uint32_t flag = 0;
if (source_p[0] == 'g') if (source_p[0] == LIT_CHAR_LOWERCASE_G)
{ {
flag = RE_FLAG_GLOBAL; flag = RE_FLAG_GLOBAL;
} }
else if (source_p[0] == 'i') else if (source_p[0] == LIT_CHAR_LOWERCASE_I)
{ {
flag = RE_FLAG_IGNORE_CASE; flag = RE_FLAG_IGNORE_CASE;
} }
else if (source_p[0] == 'm') else if (source_p[0] == LIT_CHAR_LOWERCASE_M)
{ {
flag = RE_FLAG_MULTILINE; flag = RE_FLAG_MULTILINE;
} }
@@ -1775,7 +1773,7 @@ lexer_construct_regexp_object (parser_context_t *context_p, /**< context */
} }
if (source_p < source_end_p if (source_p < source_end_p
&& util_is_identifier_part (source_p)) && lit_char_is_identifier_part (source_p))
{ {
parser_raise_error (context_p, PARSER_ERR_UNKNOWN_REGEXP_FLAG); parser_raise_error (context_p, PARSER_ERR_UNKNOWN_REGEXP_FLAG);
} }
@@ -1859,7 +1857,7 @@ lexer_expect_identifier (parser_context_t *context_p, /**< context */
context_p->token.column = context_p->column; context_p->token.column = context_p->column;
if (context_p->source_p < context_p->source_end_p if (context_p->source_p < context_p->source_end_p
&& (util_is_identifier_start (context_p->source_p) || context_p->source_p[0] == '\\')) && (lit_char_is_identifier_start (context_p->source_p) || context_p->source_p[0] == LIT_CHAR_BACKSLASH))
{ {
lexer_parse_identifier (context_p, literal_type != LEXER_STRING_LITERAL); lexer_parse_identifier (context_p, literal_type != LEXER_STRING_LITERAL);
@@ -1922,7 +1920,7 @@ lexer_expect_object_literal_id (parser_context_t *context_p, /**< context */
{ {
int create_literal_object = PARSER_FALSE; int create_literal_object = PARSER_FALSE;
if (util_is_identifier_start (context_p->source_p) || context_p->source_p[0] == '\\') if (lit_char_is_identifier_start (context_p->source_p) || context_p->source_p[0] == LIT_CHAR_BACKSLASH)
{ {
lexer_parse_identifier (context_p, PARSER_FALSE); lexer_parse_identifier (context_p, PARSER_FALSE);
@@ -1932,14 +1930,14 @@ lexer_expect_object_literal_id (parser_context_t *context_p, /**< context */
skip_spaces (context_p); skip_spaces (context_p);
if (context_p->source_p < context_p->source_end_p if (context_p->source_p < context_p->source_end_p
&& context_p->source_p[0] != ':') && context_p->source_p[0] != LIT_CHAR_COLON)
{ {
if (lexer_same_identifiers (&context_p->token.lit_location, &lexer_get_literal)) if (lexer_compare_identifier_to_current (context_p, &lexer_get_literal))
{ {
context_p->token.type = LEXER_PROPERTY_GETTER; context_p->token.type = LEXER_PROPERTY_GETTER;
return; return;
} }
else if (lexer_same_identifiers (&context_p->token.lit_location, &lexer_set_literal)) else if (lexer_compare_identifier_to_current (context_p, &lexer_set_literal))
{ {
context_p->token.type = LEXER_PROPERTY_SETTER; context_p->token.type = LEXER_PROPERTY_SETTER;
return; return;
@@ -1949,13 +1947,13 @@ lexer_expect_object_literal_id (parser_context_t *context_p, /**< context */
create_literal_object = PARSER_TRUE; create_literal_object = PARSER_TRUE;
} }
else if (context_p->source_p[0] == '"' else if (context_p->source_p[0] == LIT_CHAR_DOUBLE_QUOTE
|| context_p->source_p[0] == '\'') || context_p->source_p[0] == LIT_CHAR_SINGLE_QUOTE)
{ {
lexer_parse_string (context_p); lexer_parse_string (context_p);
create_literal_object = PARSER_TRUE; create_literal_object = PARSER_TRUE;
} }
else if (!must_be_identifier && context_p->source_p[0] == '}') else if (!must_be_identifier && context_p->source_p[0] == LIT_CHAR_RIGHT_BRACE)
{ {
context_p->token.type = LEXER_RIGHT_BRACE; context_p->token.type = LEXER_RIGHT_BRACE;
context_p->source_p += 1; context_p->source_p += 1;
@@ -1966,14 +1964,14 @@ lexer_expect_object_literal_id (parser_context_t *context_p, /**< context */
{ {
const uint8_t *char_p = context_p->source_p; const uint8_t *char_p = context_p->source_p;
if (char_p[0] == '.') if (char_p[0] == LIT_CHAR_DOT)
{ {
char_p++; char_p++;
} }
if (char_p < context_p->source_end_p if (char_p < context_p->source_end_p
&& char_p[0] >= '0' && char_p[0] >= LIT_CHAR_0
&& char_p[0] <= '9') && char_p[0] <= LIT_CHAR_9)
{ {
lexer_parse_number (context_p); lexer_parse_number (context_p);
lexer_construct_number_object (context_p, PARSER_FALSE, PARSER_FALSE); lexer_construct_number_object (context_p, PARSER_FALSE, PARSER_FALSE);
@@ -2005,7 +2003,7 @@ lexer_scan_identifier (parser_context_t *context_p, /**< context */
context_p->token.column = context_p->column; context_p->token.column = context_p->column;
if (context_p->source_p < context_p->source_end_p if (context_p->source_p < context_p->source_end_p
&& (util_is_identifier_start (context_p->source_p) || context_p->source_p[0] == '\\')) && (lit_char_is_identifier_start (context_p->source_p) || context_p->source_p[0] == LIT_CHAR_BACKSLASH))
{ {
lexer_parse_identifier (context_p, PARSER_FALSE); lexer_parse_identifier (context_p, PARSER_FALSE);
@@ -2014,13 +2012,13 @@ lexer_scan_identifier (parser_context_t *context_p, /**< context */
skip_spaces (context_p); skip_spaces (context_p);
if (context_p->source_p < context_p->source_end_p if (context_p->source_p < context_p->source_end_p
&& context_p->source_p[0] != ':') && context_p->source_p[0] != LIT_CHAR_COLON)
{ {
if (lexer_same_identifiers (&context_p->token.lit_location, &lexer_get_literal)) if (lexer_compare_identifier_to_current (context_p, &lexer_get_literal))
{ {
context_p->token.type = LEXER_PROPERTY_GETTER; context_p->token.type = LEXER_PROPERTY_GETTER;
} }
else if (lexer_same_identifiers (&context_p->token.lit_location, &lexer_set_literal)) else if (lexer_compare_identifier_to_current (context_p, &lexer_set_literal))
{ {
context_p->token.type = LEXER_PROPERTY_SETTER; context_p->token.type = LEXER_PROPERTY_SETTER;
} }
@@ -2044,44 +2042,16 @@ lexer_scan_identifier (parser_context_t *context_p, /**< context */
} /* lexer_scan_identifier */ } /* lexer_scan_identifier */
/** /**
* Converts a "\uxxxx" sequence into a unicode character * Compares the given identifier to that which is the current token
* * in the parser context.
* @return the decoded 16 bit unicode character
*/
static ecma_char_t
lexer_decode_unicode_sequence (const uint8_t *source_p) /**< source pointer */
{
ecma_char_t chr = 0;
const uint8_t *source_end_p = source_p + 6;
source_p += 2;
do
{
uint8_t byte = *source_p++;
chr = (ecma_char_t) (chr << 4);
if (byte <= '9')
{
chr = (ecma_char_t) (chr + byte - '0');
}
else
{
chr = (ecma_char_t) (chr + LEXER_TO_ASCII_LOWERCASE (byte) - ('a' - 10));
}
}
while (source_p < source_end_p);
return chr;
} /* lexer_decode_unicode_sequence */
/**
* Compares two identifiers.
* *
* @return non-zero if the input identifiers are the same * @return non-zero if the input identifiers are the same
*/ */
int int
lexer_same_identifiers (lexer_lit_location_t *left, /**< left identifier */ lexer_compare_identifier_to_current (parser_context_t *context_p, /**< context */
const lexer_lit_location_t *right) /**< right identifier */ const lexer_lit_location_t *right) /**< identifier */
{ {
lexer_lit_location_t *left = &context_p->token.lit_location;
const uint8_t *left_p; const uint8_t *left_p;
const uint8_t *right_p; const uint8_t *right_p;
size_t count; size_t count;
@@ -2108,7 +2078,7 @@ lexer_same_identifiers (lexer_lit_location_t *left, /**< left identifier */
size_t utf8_len, offset; size_t utf8_len, offset;
/* Backslash cannot be part of a multibyte UTF-8 character. */ /* Backslash cannot be part of a multibyte UTF-8 character. */
if (*left_p != '\\' && *right_p != '\\') if (*left_p != LIT_CHAR_BACKSLASH && *right_p != LIT_CHAR_BACKSLASH)
{ {
if (*left_p++ != *right_p++) if (*left_p++ != *right_p++)
{ {
@@ -2118,23 +2088,23 @@ lexer_same_identifiers (lexer_lit_location_t *left, /**< left identifier */
continue; continue;
} }
if (*left_p == '\\' && *right_p == '\\') if (*left_p == LIT_CHAR_BACKSLASH && *right_p == LIT_CHAR_BACKSLASH)
{ {
uint16_t left_chr = lexer_decode_unicode_sequence (left_p); uint16_t left_chr = lexer_hex_to_character (context_p, left_p, 6);
if (left_chr != lexer_decode_unicode_sequence (right_p)) if (left_chr != lexer_hex_to_character (context_p, right_p, 6))
{ {
return PARSER_FALSE; return PARSER_FALSE;
} }
left_p += 6; left_p += 6;
right_p += 6; right_p += 6;
count += util_get_utf8_length (left_chr); count += lit_char_get_utf8_length (left_chr);
continue; continue;
} }
/* One character is encoded as unicode sequence. */ /* One character is encoded as unicode sequence. */
if (*right_p == '\\') if (*right_p == LIT_CHAR_BACKSLASH)
{ {
/* The pointers can be swapped. */ /* The pointers can be swapped. */
const uint8_t *swap_p = left_p; const uint8_t *swap_p = left_p;
@@ -2142,7 +2112,7 @@ lexer_same_identifiers (lexer_lit_location_t *left, /**< left identifier */
right_p = swap_p; right_p = swap_p;
} }
utf8_len = util_to_utf8_bytes (utf8_buf, lexer_decode_unicode_sequence (left_p)); utf8_len = lit_char_to_utf8_bytes (utf8_buf, lexer_hex_to_character (context_p, left_p, 6));
JERRY_ASSERT (utf8_len > 0); JERRY_ASSERT (utf8_len > 0);
count -= utf8_len; count -= utf8_len;
offset = 0; offset = 0;
@@ -2162,7 +2132,7 @@ lexer_same_identifiers (lexer_lit_location_t *left, /**< left identifier */
while (count > 0); while (count > 0);
return PARSER_TRUE; return PARSER_TRUE;
} /* lexer_same_identifiers */ } /* lexer_compare_identifier_to_current */
/** /**
* @} * @}
+2 -3
View File
@@ -171,7 +171,8 @@ typedef enum
} lexer_token_type_t; } lexer_token_type_t;
#define LEXER_NEWLINE_LS_PS_BYTE_1 0xe2 #define LEXER_NEWLINE_LS_PS_BYTE_1 0xe2
#define LEXER_NEWLINE_LS_PS_BYTE_23(source) ((source)[1] == 0x80 && ((source)[2] | 0x1) == 0xa9) #define LEXER_NEWLINE_LS_PS_BYTE_23(source) \
((source)[1] == LIT_UTF8_2_BYTE_CODE_POINT_MIN && ((source)[2] | 0x1) == 0xa9)
#define LEXER_UTF8_4BYTE_START 0xf0 #define LEXER_UTF8_4BYTE_START 0xf0
#define LEXER_IS_LEFT_BRACKET(type) \ #define LEXER_IS_LEFT_BRACKET(type) \
@@ -192,8 +193,6 @@ typedef enum
#define LEXER_BINARY_LVALUE_OP_TOKEN_TO_OPCODE(token_type) \ #define LEXER_BINARY_LVALUE_OP_TOKEN_TO_OPCODE(token_type) \
((cbc_opcode_t) ((((token_type) - LEXER_ASSIGN_ADD) * 2) + CBC_ASSIGN_ADD)) ((cbc_opcode_t) ((((token_type) - LEXER_ASSIGN_ADD) * 2) + CBC_ASSIGN_ADD))
#define LEXER_TO_ASCII_LOWERCASE(character) ((character) | 0x20)
/** /**
* Lexer literal object types. * Lexer literal object types.
*/ */
+2 -1
View File
@@ -351,12 +351,13 @@ void parser_set_continues_to_current_position (parser_context_t *, parser_branch
void lexer_next_token (parser_context_t *); void lexer_next_token (parser_context_t *);
void lexer_expect_identifier (parser_context_t *, uint8_t); void lexer_expect_identifier (parser_context_t *, uint8_t);
void lexer_scan_identifier (parser_context_t *, int); void lexer_scan_identifier (parser_context_t *, int);
ecma_char_t lexer_hex_to_character (parser_context_t *context_p, const uint8_t *source_p, int length);
void lexer_expect_object_literal_id (parser_context_t *, int); void lexer_expect_object_literal_id (parser_context_t *, int);
void lexer_construct_literal_object (parser_context_t *, lexer_lit_location_t *, uint8_t); void lexer_construct_literal_object (parser_context_t *, lexer_lit_location_t *, uint8_t);
int lexer_construct_number_object (parser_context_t *, int, int); int lexer_construct_number_object (parser_context_t *, int, int);
void lexer_construct_function_object (parser_context_t *, uint32_t); void lexer_construct_function_object (parser_context_t *, uint32_t);
void lexer_construct_regexp_object (parser_context_t *, int); void lexer_construct_regexp_object (parser_context_t *, int);
int lexer_same_identifiers (lexer_lit_location_t *, const lexer_lit_location_t *); int lexer_compare_identifier_to_current (parser_context_t *, const lexer_lit_location_t *);
/* Parser functions. */ /* Parser functions. */
+3 -3
View File
@@ -1327,7 +1327,7 @@ parser_parse_break_statement (parser_context_t *context_p) /**< context */
parser_stack_iterator_skip (&iterator, 1); parser_stack_iterator_skip (&iterator, 1);
parser_stack_iterator_read (&iterator, &label_statement, sizeof (parser_label_statement_t)); parser_stack_iterator_read (&iterator, &label_statement, sizeof (parser_label_statement_t));
if (lexer_same_identifiers (&context_p->token.lit_location, &label_statement.label_ident)) if (lexer_compare_identifier_to_current (context_p, &label_statement.label_ident))
{ {
label_statement.break_list_p = parser_emit_cbc_forward_branch_item (context_p, label_statement.break_list_p = parser_emit_cbc_forward_branch_item (context_p,
opcode, opcode,
@@ -1422,7 +1422,7 @@ parser_parse_continue_statement (parser_context_t *context_p) /**< context */
parser_stack_iterator_skip (&iterator, 1); parser_stack_iterator_skip (&iterator, 1);
parser_stack_iterator_read (&iterator, &label_statement, sizeof (parser_label_statement_t)); parser_stack_iterator_read (&iterator, &label_statement, sizeof (parser_label_statement_t));
if (lexer_same_identifiers (&context_p->token.lit_location, &label_statement.label_ident)) if (lexer_compare_identifier_to_current (context_p, &label_statement.label_ident))
{ {
parser_loop_statement_t loop; parser_loop_statement_t loop;
@@ -1529,7 +1529,7 @@ parser_parse_label (parser_context_t *context_p, /**< context */
parser_stack_iterator_read (&iterator, &label_statement, sizeof (parser_label_statement_t)); parser_stack_iterator_read (&iterator, &label_statement, sizeof (parser_label_statement_t));
parser_stack_iterator_skip (&iterator, sizeof (parser_label_statement_t)); parser_stack_iterator_skip (&iterator, sizeof (parser_label_statement_t));
if (lexer_same_identifiers (label_literal_p, &label_statement.label_ident)) if (lexer_compare_identifier_to_current (context_p, &label_statement.label_ident))
{ {
parser_raise_error (context_p, PARSER_ERR_DUPLICATED_LABEL); parser_raise_error (context_p, PARSER_ERR_DUPLICATED_LABEL);
} }
+84
View File
@@ -0,0 +1,84 @@
/* Copyright 2015 Samsung Electronics Co., Ltd.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "ecma-helpers.h"
#include "lit-strings.h"
#include "ecma-init-finalize.h"
#include "lit-literal.h"
#include "lit-char-helpers.h"
#include "js-parser-internal.h"
#include "test-common.h"
/**
 * Unit test: UTF-8 length of code units decoded from "\uXXXX" escape sequences.
 *
 * Every input is a six character escape sequence. The four hexadecimal digits
 * that follow the "\u" prefix are decoded with lexer_hex_to_character and the
 * resulting code unit is handed to lit_char_get_utf8_length. The expected
 * lengths follow the UTF-8 encoding ranges:
 *   0x0000 - 0x007F: 1 byte
 *   0x0080 - 0x07FF: 2 bytes
 *   0x0800 - 0xFFFF: 3 bytes
 *
 * @return 0 - the checks themselves are performed with JERRY_ASSERT
 */
int
main (int __attr_unused___ argc,
      char __attr_unused___ **argv)
{
  TEST_INIT ();

  mem_init ();
  lit_init ();
  ecma_init ();

  /* The doubled backslash yields a literal '\' in the array, so each buffer
   * holds the characters \, u and four hex digits. */
  const uint8_t _1_byte_long1[] = "\\u007F";
  const uint8_t _1_byte_long2[] = "\\u0000";
  const uint8_t _1_byte_long3[] = "\\u0065";
  const uint8_t _2_byte_long1[] = "\\u008F";
  const uint8_t _2_byte_long2[] = "\\u00FF";
  const uint8_t _2_byte_long3[] = "\\u07FF";
  const uint8_t _3_byte_long1[] = "\\u08FF";
  const uint8_t _3_byte_long2[] = "\\u0FFF";
  const uint8_t _3_byte_long3[] = "\\uFFFF";

  size_t length;

  /* In every call below "+ 2" skips the "\u" prefix and 4 is the number of hex
   * digits to decode. The parser context argument is passed as 0.
   * NOTE(review): presumably the context is only needed when the digits are
   * malformed - confirm against lexer_hex_to_character. */

  // test 1-byte-long unicode sequences
  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _1_byte_long1 + 2, 4));
  JERRY_ASSERT (length == 1);

  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _1_byte_long2 + 2, 4));
  JERRY_ASSERT (length == 1);

  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _1_byte_long3 + 2, 4));
  JERRY_ASSERT (length == 1);

  // test 2-byte-long unicode sequences
  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _2_byte_long1 + 2, 4));
  JERRY_ASSERT (length == 2);

  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _2_byte_long2 + 2, 4));
  JERRY_ASSERT (length == 2);

  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _2_byte_long3 + 2, 4));
  JERRY_ASSERT (length == 2);

  // test 3-byte-long unicode sequences
  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _3_byte_long1 + 2, 4));
  /* 0x08FF is inside the 3-byte range, so require the exact length instead of
   * merely ruling out 2. */
  JERRY_ASSERT (length == 3);

  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _3_byte_long2 + 2, 4));
  JERRY_ASSERT (length == 3);

  length = lit_char_get_utf8_length (lexer_hex_to_character (0, _3_byte_long3 + 2, 4));
  JERRY_ASSERT (length == 3);

  /* Tear down in the reverse order of initialization. */
  ecma_finalize ();
  lit_finalize ();
  mem_finalize (true);

  return 0;
} /* main */