/* Copyright 2014-2015 Samsung Electronics Co., Ltd. * Copyright 2015 University of Szeged * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "ecma-alloc.h" #include "ecma-builtins.h" #include "ecma-conversion.h" #include "ecma-eval.h" #include "ecma-exceptions.h" #include "ecma-gc.h" #include "ecma-globals.h" #include "ecma-helpers.h" #include "ecma-try-catch-macro.h" #include "jrt.h" #include "lit-char-helpers.h" #include "lit-magic-strings.h" #include "lit-strings.h" #include "vm.h" #include "jrt-libc-includes.h" #define ECMA_BUILTINS_INTERNAL #include "ecma-builtins-internal.h" #define BUILTIN_INC_HEADER_NAME "ecma-builtin-global.inc.h" #define BUILTIN_UNDERSCORED_ID global #include "ecma-builtin-internal-routines-template.inc.h" /** \addtogroup ecma ECMA * @{ * * \addtogroup ecmabuiltins * @{ * * \addtogroup global ECMA Global object built-in * @{ */ /** * The implementation-defined Global object's 'print' routine * * The routine converts all of its arguments to strings and outputs them using 'printf'. * * Code points, with except of character, that are representable with one utf8-byte * are outputted as is, using '%c' format argument, and other code points are outputted as '\uhhll', * where hh and ll are values of code point's high and low bytes, correspondingly. * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_print (ecma_value_t this_arg __attr_unused___, /**< this argument */ const ecma_value_t args[], /**< arguments list */ ecma_length_t args_number) /**< number of arguments */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); /* * TODO: * Move the 'print' routine out of engine core. */ for (ecma_length_t arg_index = 0; ecma_is_completion_value_empty (ret_value) && arg_index < args_number; arg_index++) { ECMA_TRY_CATCH (str_value, ecma_op_to_string (args[arg_index]), ret_value); ecma_string_t *str_p = ecma_get_string_from_value (str_value); lit_utf8_size_t utf8_str_size = ecma_string_get_size (str_p); MEM_DEFINE_LOCAL_ARRAY (utf8_str_p, utf8_str_size, lit_utf8_byte_t); ssize_t actual_sz = ecma_string_to_utf8_string (str_p, utf8_str_p, (ssize_t) utf8_str_size); JERRY_ASSERT (actual_sz == (ssize_t) utf8_str_size); lit_utf8_iterator_t str_iter = lit_utf8_iterator_create (utf8_str_p, utf8_str_size); while (!lit_utf8_iterator_is_eos (&str_iter)) { ecma_char_t code_point = lit_utf8_iterator_read_next (&str_iter); if (code_point == LIT_CHAR_NULL) { printf ("\\u0000"); } else if (code_point <= LIT_UTF8_1_BYTE_CODE_POINT_MAX) { printf ("%c", (char) code_point); } else { JERRY_STATIC_ASSERT (sizeof (code_point) == 2); uint32_t byte_high = (uint32_t) jrt_extract_bit_field (code_point, JERRY_BITSINBYTE, JERRY_BITSINBYTE); uint32_t byte_low = (uint32_t) jrt_extract_bit_field (code_point, 0, JERRY_BITSINBYTE); printf ("\\u%02x%02x", byte_high, byte_low); } } if (arg_index < args_number - 1) { printf (" "); } MEM_FINALIZE_LOCAL_ARRAY (utf8_str_p); ECMA_FINALIZE (str_value); } printf ("\n"); if (ecma_is_completion_value_empty (ret_value)) { ret_value = ecma_make_normal_completion_value (ecma_make_simple_value (ECMA_SIMPLE_VALUE_UNDEFINED)); } return ret_value; } /* ecma_builtin_global_object_print */ /** * The Global object's 'eval' routine * * See also: * ECMA-262 v5, 15.1.2.1 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_eval (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t x) /**< routine's first argument */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); bool is_direct_eval = vm_is_direct_eval_form_call (); /* See also: ECMA-262 v5, 10.1.1 */ bool is_called_from_strict_mode_code; if (is_direct_eval) { is_called_from_strict_mode_code = vm_is_strict_mode (); } else { is_called_from_strict_mode_code = false; } if (!ecma_is_value_string (x)) { /* step 1 */ ret_value = ecma_make_normal_completion_value (ecma_copy_value (x, true)); } else { /* steps 2 to 8 */ ret_value = ecma_op_eval (ecma_get_string_from_value (x), is_direct_eval, is_called_from_strict_mode_code); } return ret_value; } /* ecma_builtin_global_object_eval */ /** * The Global object's 'parseInt' routine * * See also: * ECMA-262 v5, 15.1.2.2 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_parse_int (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t string, /**< routine's first argument */ ecma_value_t radix) /**< routine's second argument */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); /* 1. */ ECMA_TRY_CATCH (string_var, ecma_op_to_string (string), ret_value); ecma_string_t *number_str_p = ecma_get_string_from_value (string_var); lit_utf8_size_t str_size = ecma_string_get_size (number_str_p); if (str_size > 0) { MEM_DEFINE_LOCAL_ARRAY (utf8_string_buff, str_size, lit_utf8_byte_t); ssize_t bytes_copied = ecma_string_to_utf8_string (number_str_p, utf8_string_buff, (ssize_t) str_size); JERRY_ASSERT (bytes_copied >= 0); lit_utf8_iterator_t iter = lit_utf8_iterator_create (utf8_string_buff, str_size); /* 2. Remove leading whitespace. */ lit_utf8_iterator_seek_eos (&iter); lit_utf8_iterator_pos_t start = lit_utf8_iterator_get_pos (&iter); lit_utf8_iterator_pos_t end = lit_utf8_iterator_get_pos (&iter); lit_utf8_iterator_seek_bos (&iter); while (!lit_utf8_iterator_is_eos (&iter)) { ecma_char_t current_char = lit_utf8_iterator_read_next (&iter); if (!lit_char_is_white_space (current_char) && !lit_char_is_line_terminator (current_char)) { lit_utf8_iterator_read_prev (&iter); start = lit_utf8_iterator_get_pos (&iter); break; } } /* 3. */ int sign = 1; /* 4. */ ecma_char_t current = lit_utf8_iterator_read_next (&iter); if (current == LIT_CHAR_MINUS) { sign = -1; } /* 5. */ if (current == LIT_CHAR_MINUS || current == LIT_CHAR_PLUS) { start = lit_utf8_iterator_get_pos (&iter); if (!lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); } } /* 6. */ ECMA_OP_TO_NUMBER_TRY_CATCH (radix_num, radix, ret_value); int32_t rad = ecma_number_to_int32 (radix_num); /* 7.*/ bool strip_prefix = true; /* 8. */ if (rad != 0) { /* 8.a */ if (rad < 2 || rad > 36) { ecma_number_t *ret_num_p = ecma_alloc_number (); *ret_num_p = ecma_number_make_nan (); ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); } /* 8.b */ else if (rad != 16) { strip_prefix = false; } } /* 9. */ else { rad = 10; } if (ecma_is_completion_value_empty (ret_value)) { /* 10. */ if (strip_prefix) { if (end.offset - start.offset >= 2 && current == LIT_CHAR_0) { ecma_char_t next = lit_utf8_iterator_peek_next (&iter); if (next == LIT_CHAR_LOWERCASE_X || next == LIT_CHAR_UPPERCASE_X) { /* Skip the 'x' or 'X' characters. */ lit_utf8_iterator_incr (&iter); start = lit_utf8_iterator_get_pos (&iter); rad = 16; } } } /* 11. Check if characters are in [0, Radix - 1]. We also convert them to number values in the process. */ lit_utf8_iterator_seek (&iter, start); while (!lit_utf8_iterator_is_eos (&iter)) { ecma_char_t current_char = lit_utf8_iterator_read_next (&iter); int32_t current_number; if ((current_char >= LIT_CHAR_LOWERCASE_A && current_char <= LIT_CHAR_LOWERCASE_Z)) { current_number = current_char - LIT_CHAR_LOWERCASE_A + 10; } else if ((current_char >= LIT_CHAR_UPPERCASE_A && current_char <= LIT_CHAR_UPPERCASE_Z)) { current_number = current_char - LIT_CHAR_UPPERCASE_A + 10; } else if (lit_char_is_decimal_digit (current_char)) { current_number = current_char - LIT_CHAR_0; } else { /* Not a valid number char, set value to radix so it fails to pass as a valid character. */ current_number = rad; } if (!(current_number < rad)) { lit_utf8_iterator_decr (&iter); end = lit_utf8_iterator_get_pos (&iter); break; } } /* 12. */ if (end.offset - start.offset == 0) { ecma_number_t *ret_num_p = ecma_alloc_number (); *ret_num_p = ecma_number_make_nan (); ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); } } if (ecma_is_completion_value_empty (ret_value)) { ecma_number_t *value_p = ecma_alloc_number (); *value_p = 0; ecma_number_t multiplier = 1.0f; /* 13. and 14. */ lit_utf8_iterator_seek (&iter, end); while (lit_utf8_iterator_get_pos (&iter).offset > start.offset) { ecma_char_t current_char = lit_utf8_iterator_read_prev (&iter); ecma_number_t current_number; if ((current_char >= LIT_CHAR_LOWERCASE_A && current_char <= LIT_CHAR_LOWERCASE_Z)) { current_number = (ecma_number_t) current_char - LIT_CHAR_LOWERCASE_A + 10; } else if ((current_char >= LIT_CHAR_UPPERCASE_A && current_char <= LIT_CHAR_UPPERCASE_Z)) { current_number = (ecma_number_t) current_char - LIT_CHAR_UPPERCASE_A + 10; } else if (lit_char_is_decimal_digit (current_char)) { current_number = (ecma_number_t) current_char - LIT_CHAR_0; } else { JERRY_UNREACHABLE (); } *value_p += current_number * multiplier; multiplier *= (ecma_number_t) rad; } /* 15. */ if (sign < 0) { *value_p *= (ecma_number_t) sign; } ret_value = ecma_make_normal_completion_value (ecma_make_number_value (value_p)); } ECMA_OP_TO_NUMBER_FINALIZE (radix_num); MEM_FINALIZE_LOCAL_ARRAY (utf8_string_buff); } else { ecma_number_t *ret_num_p = ecma_alloc_number (); *ret_num_p = ecma_number_make_nan (); ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); } ECMA_FINALIZE (string_var); return ret_value; } /* ecma_builtin_global_object_parse_int */ /** * The Global object's 'parseFloat' routine * * See also: * ECMA-262 v5, 15.1.2.3 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_parse_float (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t string) /**< routine's first argument */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); /* 1. */ ECMA_TRY_CATCH (string_var, ecma_op_to_string (string), ret_value); ecma_string_t *number_str_p = ecma_get_string_from_value (string_var); lit_utf8_size_t str_size = ecma_string_get_size (number_str_p); if (str_size > 0) { MEM_DEFINE_LOCAL_ARRAY (utf8_string_buff, str_size, lit_utf8_byte_t); ssize_t bytes_copied = ecma_string_to_utf8_string (number_str_p, utf8_string_buff, (ssize_t) str_size); JERRY_ASSERT (bytes_copied >= 0); lit_utf8_iterator_t iter = lit_utf8_iterator_create (utf8_string_buff, str_size); lit_utf8_iterator_seek_eos (&iter); lit_utf8_iterator_pos_t start = lit_utf8_iterator_get_pos (&iter); lit_utf8_iterator_pos_t end = lit_utf8_iterator_get_pos (&iter); lit_utf8_iterator_seek_bos (&iter); /* 2. Find first non whitespace char and set starting position. */ while (!lit_utf8_iterator_is_eos (&iter)) { ecma_char_t current_char = lit_utf8_iterator_read_next (&iter); if (!lit_char_is_white_space (current_char) && !lit_char_is_line_terminator (current_char)) { lit_utf8_iterator_decr (&iter); start = lit_utf8_iterator_get_pos (&iter); break; } } bool sign = false; ecma_char_t current; if (!lit_utf8_iterator_is_eos (&iter)) { /* Check if sign is present. */ current = lit_utf8_iterator_read_next (&iter); if (current == LIT_CHAR_MINUS) { sign = true; } if (current == LIT_CHAR_MINUS || current == LIT_CHAR_PLUS) { /* Set starting position to be after the sign character. */ start = lit_utf8_iterator_get_pos (&iter); } else { lit_utf8_iterator_decr (&iter); } } ecma_number_t *ret_num_p = ecma_alloc_number (); const lit_utf8_byte_t *infinity_utf8_str_p = lit_get_magic_string_utf8 (LIT_MAGIC_STRING_INFINITY_UL); lit_utf8_iterator_t infinity_iter = lit_utf8_iterator_create (infinity_utf8_str_p, sizeof (*infinity_utf8_str_p)); JERRY_ASSERT (!lit_utf8_iterator_is_eos (&infinity_iter)); /* Check if string is equal to "Infinity". */ while (!lit_utf8_iterator_is_eos (&iter) && (lit_utf8_iterator_read_next (&iter) == lit_utf8_iterator_read_next (&infinity_iter))) { if (lit_utf8_iterator_is_eos (&infinity_iter)) { /* String matched Infinity. */ *ret_num_p = ecma_number_make_infinity (sign); ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); break; } } /* Reset to starting position. */ lit_utf8_iterator_seek (&iter, start); if (ecma_is_completion_value_empty (ret_value) && !lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); bool has_whole_part = false; bool has_fraction_part = false; /* Check digits of whole part. */ if (lit_char_is_decimal_digit (current)) { has_whole_part = true; while (!lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); if (!lit_char_is_decimal_digit (current)) { lit_utf8_iterator_decr (&iter); break; } } } else { lit_utf8_iterator_decr (&iter); } /* Set end position to the end of whole part. */ end = lit_utf8_iterator_get_pos (&iter); if (!lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); } /* Check decimal point. */ if (current == LIT_CHAR_DOT && !lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); if (lit_char_is_decimal_digit (current)) { has_fraction_part = true; /* Check digits of fractional part. */ while (!lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); if (!lit_char_is_decimal_digit (current)) { lit_utf8_iterator_decr (&iter); break; } } /* Set end position to end of fraction part. */ end = lit_utf8_iterator_get_pos (&iter); } else { lit_utf8_iterator_decr (&iter); } } else { lit_utf8_iterator_decr (&iter); } if (!lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); } /* Check exponent. */ if ((current == LIT_CHAR_LOWERCASE_E || current == LIT_CHAR_UPPERCASE_E) && (has_whole_part || has_fraction_part) && !lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); /* Check sign of exponent. */ if ((current == LIT_CHAR_PLUS || current == LIT_CHAR_MINUS) && !lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); } if (lit_char_is_decimal_digit (current)) { /* Check digits of exponent part. */ while (!lit_utf8_iterator_is_eos (&iter)) { current = lit_utf8_iterator_read_next (&iter); if (!lit_char_is_decimal_digit (current)) { lit_utf8_iterator_decr (&iter); break; } } /* Set end position to end of exponent part. */ end = lit_utf8_iterator_get_pos (&iter); } } else { lit_utf8_iterator_decr (&iter); } /* String did not contain a valid number. */ if (start.offset == end.offset) { *ret_num_p = ecma_number_make_nan (); ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); } else { /* 5. */ *ret_num_p = ecma_utf8_string_to_number (utf8_string_buff + start.offset, (lit_utf8_size_t) (end.offset - start.offset)); if (sign) { *ret_num_p *= -1; } ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); } } /* String ended after sign character, or was empty after removing leading whitespace. */ else if (ecma_is_completion_value_empty (ret_value)) { *ret_num_p = ecma_number_make_nan (); ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); } MEM_FINALIZE_LOCAL_ARRAY (utf8_string_buff); } /* String length is zero. */ else { ecma_number_t *ret_num_p = ecma_alloc_number (); *ret_num_p = ecma_number_make_nan (); ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p)); } ECMA_FINALIZE (string_var); return ret_value; } /* ecma_builtin_global_object_parse_float */ /** * The Global object's 'isNaN' routine * * See also: * ECMA-262 v5, 15.1.2.4 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_is_nan (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t arg) /**< routine's first argument */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); ECMA_OP_TO_NUMBER_TRY_CATCH (arg_num, arg, ret_value); bool is_nan = ecma_number_is_nan (arg_num); ret_value = ecma_make_simple_completion_value (is_nan ? ECMA_SIMPLE_VALUE_TRUE : ECMA_SIMPLE_VALUE_FALSE); ECMA_OP_TO_NUMBER_FINALIZE (arg_num); return ret_value; } /* ecma_builtin_global_object_is_nan */ /** * The Global object's 'isFinite' routine * * See also: * ECMA-262 v5, 15.1.2.5 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_is_finite (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t arg) /**< routine's first argument */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); ECMA_OP_TO_NUMBER_TRY_CATCH (arg_num, arg, ret_value); bool is_finite = !(ecma_number_is_nan (arg_num) || ecma_number_is_infinity (arg_num)); ret_value = ecma_make_simple_completion_value (is_finite ? ECMA_SIMPLE_VALUE_TRUE : ECMA_SIMPLE_VALUE_FALSE); ECMA_OP_TO_NUMBER_FINALIZE (arg_num); return ret_value; } /* ecma_builtin_global_object_is_finite */ /** * Helper function to check whether a character is in a character bitset. * * @return true if the character is in the character bitset. */ static bool ecma_builtin_global_object_character_is_in (uint32_t character, /**< character */ uint8_t *bitset) /**< character set */ { JERRY_ASSERT (character < 128); return (bitset[character >> 3] & (1 << (character & 0x7))) != 0; } /* ecma_builtin_global_object_character_is_in */ /* * Unescaped URI characters bitset: * One bit for each character between 0 - 127. * Bit is set if the character is in the unescaped URI set. */ static uint8_t unescaped_uri_set[16] = { 0x0, 0x0, 0x0, 0x0, 0xda, 0xff, 0xff, 0xaf, 0xff, 0xff, 0xff, 0x87, 0xfe, 0xff, 0xff, 0x47 }; /* * Unescaped URI component characters bitset: * One bit for each character between 0 - 127. * Bit is set if the character is in the unescaped component URI set. */ static uint8_t unescaped_uri_component_set[16] = { 0x0, 0x0, 0x0, 0x0, 0x82, 0x67, 0xff, 0x3, 0xfe, 0xff, 0xff, 0x87, 0xfe, 0xff, 0xff, 0x47 }; /* * Format is a percent sign followed by two hex digits. */ #define URI_ENCODED_BYTE_SIZE (3) /* * These two types shows whether the byte is present in * the original stream or decoded from a %xx sequence. */ #define URI_DECODE_ORIGINAL_BYTE 0 #define URI_DECODE_DECODED_BYTE 1 /** * Helper function to decode URI. * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_decode_uri_helper (ecma_value_t uri __attr_unused___, /**< uri argument */ uint8_t *reserved_uri_bitset) /**< reserved characters bitset */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); ECMA_TRY_CATCH (string, ecma_op_to_string (uri), ret_value); JERRY_ASSERT (ecma_is_value_string (string)); ecma_string_t *input_string_p = ecma_get_string_from_value (string); lit_utf8_size_t input_size = ecma_string_get_size (input_string_p); MEM_DEFINE_LOCAL_ARRAY (input_start_p, input_size + 1, lit_utf8_byte_t); ecma_string_to_utf8_string (input_string_p, input_start_p, (ssize_t) (input_size)); input_start_p[input_size] = LIT_BYTE_NULL; lit_utf8_byte_t *input_char_p = input_start_p; lit_utf8_byte_t *input_end_p = input_start_p + input_size; lit_utf8_size_t output_size = 0; /* * The URI decoding has two major phases: first we validate the input, * and compute the length of the output, then we decode the input. */ while (input_char_p < input_end_p) { /* * We expect that the input is a valid UTF-8 sequence, * so characters >= 0x80 can be let through. */ if (*input_char_p != '%') { output_size++; input_char_p++; continue; } lit_code_point_t decoded_byte; if (!lit_read_code_point_from_hex (input_char_p + 1, 2, &decoded_byte)) { ret_value = ecma_make_throw_obj_completion_value (ecma_new_standard_error (ECMA_ERROR_URI)); break; } input_char_p += URI_ENCODED_BYTE_SIZE; if (decoded_byte <= LIT_UTF8_1_BYTE_CODE_POINT_MAX) { /* * We don't decode those bytes, which are part of reserved_uri_bitset * but not part of unescaped_uri_component_set. */ if (ecma_builtin_global_object_character_is_in (decoded_byte, reserved_uri_bitset) && !ecma_builtin_global_object_character_is_in (decoded_byte, unescaped_uri_component_set)) { output_size += URI_ENCODED_BYTE_SIZE; } else { output_size++; } } else { output_size++; } } if (ecma_is_completion_value_empty (ret_value)) { MEM_DEFINE_LOCAL_ARRAY (output_start_p, output_size * 2, lit_utf8_byte_t); input_char_p = input_start_p; lit_utf8_byte_t *output_char_p = output_start_p; lit_utf8_byte_t *output_type_p = output_start_p + output_size; while (input_char_p < input_end_p) { /* Input decode. */ if (*input_char_p != '%') { *output_type_p++ = URI_DECODE_ORIGINAL_BYTE; *output_char_p = *input_char_p; output_char_p++; input_char_p++; continue; } *output_type_p++ = URI_DECODE_DECODED_BYTE; lit_code_point_t decoded_byte; lit_read_code_point_from_hex (input_char_p + 1, 2, &decoded_byte); input_char_p += URI_ENCODED_BYTE_SIZE; if (decoded_byte <= LIT_UTF8_1_BYTE_CODE_POINT_MAX) { if (ecma_builtin_global_object_character_is_in (decoded_byte, reserved_uri_bitset) && !ecma_builtin_global_object_character_is_in (decoded_byte, unescaped_uri_component_set)) { *output_char_p = '%'; output_char_p++; input_char_p -= 2; } else { *output_char_p = (lit_utf8_byte_t) decoded_byte; output_char_p++; } } else { *output_char_p = (lit_utf8_byte_t) decoded_byte; output_char_p++; } } JERRY_ASSERT (output_start_p + output_size == output_char_p); bool valid_utf8 = lit_is_utf8_string_valid (output_start_p, output_size); if (valid_utf8) { lit_utf8_iterator_t characters = lit_utf8_iterator_create (output_start_p, output_size); output_type_p = output_start_p + output_size; while (!lit_utf8_iterator_is_eos (&characters)) { bool original_byte = output_type_p[characters.buf_pos.offset] == URI_DECODE_ORIGINAL_BYTE; ecma_char_t character = lit_utf8_iterator_read_next (&characters); /* Surrogate fragments are allowed in JS, but not accepted by URI decoding. */ if (!original_byte) { if (lit_is_code_unit_high_surrogate (character)) { /* Note: stray high/low surrogate pairs are not allowed in the stream. */ if (lit_utf8_iterator_is_eos (&characters)) { valid_utf8 = false; break; } if (output_type_p[characters.buf_pos.offset] == URI_DECODE_ORIGINAL_BYTE || !lit_is_code_unit_low_surrogate (lit_utf8_iterator_read_next (&characters))) { valid_utf8 = false; break; } } else if (lit_is_code_unit_low_surrogate (character)) { valid_utf8 = false; break; } } } } if (valid_utf8) { ecma_string_t *output_string_p = ecma_new_ecma_string_from_utf8 (output_start_p, output_size); ret_value = ecma_make_normal_completion_value (ecma_make_string_value (output_string_p)); } else { ret_value = ecma_make_throw_obj_completion_value (ecma_new_standard_error (ECMA_ERROR_URI)); } MEM_FINALIZE_LOCAL_ARRAY (output_start_p); } MEM_FINALIZE_LOCAL_ARRAY (input_start_p); ECMA_FINALIZE (string); return ret_value; } /* ecma_builtin_global_object_decode_uri_helper */ /** * The Global object's 'decodeURI' routine * * See also: * ECMA-262 v5, 15.1.3.1 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_decode_uri (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t encoded_uri) /**< routine's first argument */ { return ecma_builtin_global_object_decode_uri_helper (encoded_uri, unescaped_uri_set); } /* ecma_builtin_global_object_decode_uri */ /** * The Global object's 'decodeURIComponent' routine * * See also: * ECMA-262 v5, 15.1.3.2 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_decode_uri_component (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t encoded_uri_component) /**< routine's * first argument */ { return ecma_builtin_global_object_decode_uri_helper (encoded_uri_component, unescaped_uri_component_set); } /* ecma_builtin_global_object_decode_uri_component */ /** * Helper function to encode byte as hexadecimal values. */ static void ecma_builtin_global_object_byte_to_hex (lit_utf8_byte_t *dest_p, /**< destination pointer */ uint32_t byte) /**< value */ { JERRY_ASSERT (byte < 256); dest_p[0] = '%'; ecma_char_t hex_digit = (ecma_char_t) (byte >> 4); dest_p[1] = (lit_utf8_byte_t) ((hex_digit > 9) ? (hex_digit + ('A' - 10)) : (hex_digit + '0')); hex_digit = (lit_utf8_byte_t) (byte & 0xf); dest_p[2] = (lit_utf8_byte_t) ((hex_digit > 9) ? (hex_digit + ('A' - 10)) : (hex_digit + '0')); } /* ecma_builtin_global_object_byte_to_hex */ /** * Helper function to encode URI. * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_encode_uri_helper (ecma_value_t uri, /**< uri argument */ uint8_t* unescaped_uri_bitset) /**< unescaped bitset */ { ecma_completion_value_t ret_value = ecma_make_empty_completion_value (); ECMA_TRY_CATCH (string, ecma_op_to_string (uri), ret_value); JERRY_ASSERT (ecma_is_value_string (string)); ecma_string_t *input_string_p = ecma_get_string_from_value (string); lit_utf8_size_t input_size = ecma_string_get_size (input_string_p); MEM_DEFINE_LOCAL_ARRAY (input_start_p, input_size, lit_utf8_byte_t); ecma_string_to_utf8_string (input_string_p, input_start_p, (ssize_t) (input_size)); /* * The URI encoding has two major phases: first we validate the input, * and compute the length of the output, then we encode the input. */ lit_utf8_byte_t *input_char_p = input_start_p; lit_utf8_byte_t *input_end_p = input_start_p + input_size; lit_utf8_size_t output_length = 0; while (input_char_p < input_end_p) { /* * We expect that the input is a valid UTF-8 sequence, * so we only need to reject stray surrogate pairs. */ /* Input validation. */ if (*input_char_p <= LIT_UTF8_1_BYTE_CODE_POINT_MAX) { if (ecma_builtin_global_object_character_is_in (*input_char_p, unescaped_uri_bitset)) { output_length++; } else { output_length += URI_ENCODED_BYTE_SIZE; } } else if (*input_char_p == (LIT_UTF8_3_BYTE_MARKER + (LIT_UTF16_HIGH_SURROGATE_MARKER >> 12))) { /* The next character is in the [0xd000, 0xdfff] range. */ output_length += URI_ENCODED_BYTE_SIZE; input_char_p++; JERRY_ASSERT (input_char_p < input_end_p); JERRY_ASSERT ((*input_char_p & LIT_UTF8_EXTRA_BYTE_MASK) == LIT_UTF8_EXTRA_BYTE_MARKER); /* If this condition is true, the next character is >= LIT_UTF16_HIGH_SURROGATE_MIN. */ if (*input_char_p & 0x20) { ret_value = ecma_make_throw_obj_completion_value (ecma_new_standard_error (ECMA_ERROR_URI)); break; } output_length += URI_ENCODED_BYTE_SIZE; } else { output_length += URI_ENCODED_BYTE_SIZE; } input_char_p++; } if (ecma_is_completion_value_empty (ret_value)) { MEM_DEFINE_LOCAL_ARRAY (output_start_p, output_length, lit_utf8_byte_t); lit_utf8_byte_t *output_char_p = output_start_p; input_char_p = input_start_p; while (input_char_p < input_end_p) { /* Input decode. */ if (*input_char_p <= LIT_UTF8_1_BYTE_CODE_POINT_MAX) { if (ecma_builtin_global_object_character_is_in (*input_char_p, unescaped_uri_bitset)) { *output_char_p++ = *input_char_p; } else { ecma_builtin_global_object_byte_to_hex (output_char_p, *input_char_p); output_char_p += URI_ENCODED_BYTE_SIZE; } } else { ecma_builtin_global_object_byte_to_hex (output_char_p, *input_char_p); output_char_p += URI_ENCODED_BYTE_SIZE; } input_char_p++; } JERRY_ASSERT (output_start_p + output_length == output_char_p); ecma_string_t *output_string_p = ecma_new_ecma_string_from_utf8 (output_start_p, output_length); ret_value = ecma_make_normal_completion_value (ecma_make_string_value (output_string_p)); MEM_FINALIZE_LOCAL_ARRAY (output_start_p); } MEM_FINALIZE_LOCAL_ARRAY (input_start_p); ECMA_FINALIZE (string); return ret_value; } /* ecma_builtin_global_object_encode_uri_helper */ /** * The Global object's 'encodeURI' routine * * See also: * ECMA-262 v5, 15.1.3.3 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_encode_uri (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t uri) /**< routine's first argument */ { return ecma_builtin_global_object_encode_uri_helper (uri, unescaped_uri_set); } /* ecma_builtin_global_object_encode_uri */ /** * The Global object's 'encodeURIComponent' routine * * See also: * ECMA-262 v5, 15.1.3.4 * * @return completion value * Returned value must be freed with ecma_free_completion_value. */ static ecma_completion_value_t ecma_builtin_global_object_encode_uri_component (ecma_value_t this_arg __attr_unused___, /**< this argument */ ecma_value_t uri_component) /**< routine's first argument */ { return ecma_builtin_global_object_encode_uri_helper (uri_component, unescaped_uri_component_set); } /* ecma_builtin_global_object_encode_uri_component */ /** * @} * @} * @} */