jerryscript/jerry-core/ecma/builtin-objects/ecma-builtin-global.cpp

/* Copyright 2014-2015 Samsung Electronics Co., Ltd.
 * Copyright 2015 University of Szeged
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "ecma-alloc.h"
#include "ecma-builtins.h"
#include "ecma-conversion.h"
#include "ecma-eval.h"
#include "ecma-exceptions.h"
#include "ecma-gc.h"
#include "ecma-globals.h"
#include "ecma-helpers.h"
#include "ecma-try-catch-macro.h"
#include "jrt.h"
#include "lit-char-helpers.h"
#include "lit-magic-strings.h"
#include "lit-strings.h"
#include "vm.h"
#include "jrt-libc-includes.h"

#define ECMA_BUILTINS_INTERNAL
#include "ecma-builtins-internal.h"

#define BUILTIN_INC_HEADER_NAME "ecma-builtin-global.inc.h"
#define BUILTIN_UNDERSCORED_ID global
#include "ecma-builtin-internal-routines-template.inc.h"

/** \addtogroup ecma ECMA
 * @{
 *
 * \addtogroup ecmabuiltins
 * @{
 *
 * \addtogroup global ECMA Global object built-in
 * @{
 */

/**
 * The implementation-defined Global object's 'print' routine
 *
 * Every argument is converted to a string and written out using 'printf'. Consecutive arguments
 * are separated by a single space, and a line feed is written after the last processed argument.
 *
 * Output format of a single code unit:
 *  - the <NUL> character is written as the escape sequence '\u0000';
 *  - any other code unit representable with one utf8-byte is written as is ('%c' format argument);
 *  - every remaining code unit is written as '\uhhll', where hh and ll are the hexadecimal values
 *    of the code unit's high and low bytes, correspondingly.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_print (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                  const ecma_value_t args[], /**< arguments list */
                                  ecma_length_t args_number) /**< number of arguments */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  /*
   * TODO:
   *      Move the 'print' routine out of engine core.
   */

  ecma_length_t arg_index = 0;

  /* Processing stops as soon as a conversion leaves a non-empty completion value in ret_value. */
  while (ecma_is_completion_value_empty (ret_value) && arg_index < args_number)
  {
    ECMA_TRY_CATCH (arg_str_value,
                    ecma_op_to_string (args[arg_index]),
                    ret_value);

    ecma_string_t *arg_str_p = ecma_get_string_from_value (arg_str_value);
    lit_utf8_size_t buffer_size = ecma_string_get_size (arg_str_p);

    MEM_DEFINE_LOCAL_ARRAY (buffer_p, buffer_size, lit_utf8_byte_t);

    ssize_t copied_size = ecma_string_to_utf8_string (arg_str_p, buffer_p, (ssize_t) buffer_size);
    JERRY_ASSERT (copied_size == (ssize_t) buffer_size);

    lit_utf8_iterator_t char_iter = lit_utf8_iterator_create (buffer_p, buffer_size);

    while (!lit_utf8_iterator_is_eos (&char_iter))
    {
      ecma_char_t code_unit = lit_utf8_iterator_read_next (&char_iter);

      if (code_unit > LIT_UTF8_1_BYTE_CODE_POINT_MAX)
      {
        /* Not representable with a single utf8-byte: print the two bytes of the code unit in hex. */
        JERRY_STATIC_ASSERT (sizeof (code_unit) == 2);

        uint32_t high_byte = (uint32_t) jrt_extract_bit_field (code_unit,
                                                               JERRY_BITSINBYTE,
                                                               JERRY_BITSINBYTE);
        uint32_t low_byte = (uint32_t) jrt_extract_bit_field (code_unit,
                                                              0,
                                                              JERRY_BITSINBYTE);

        printf ("\\u%02x%02x", high_byte, low_byte);
      }
      else if (code_unit == LIT_CHAR_NULL)
      {
        printf ("\\u0000");
      }
      else
      {
        printf ("%c", (char) code_unit);
      }
    }

    /* A separator is written after every argument except the last one. */
    if (arg_index + 1 < args_number)
    {
      printf (" ");
    }

    MEM_FINALIZE_LOCAL_ARRAY (buffer_p);

    ECMA_FINALIZE (arg_str_value);

    arg_index++;
  }

  printf ("\n");

  if (ecma_is_completion_value_empty (ret_value))
  {
    ret_value = ecma_make_normal_completion_value (ecma_make_simple_value (ECMA_SIMPLE_VALUE_UNDEFINED));
  }

  return ret_value;
} /* ecma_builtin_global_object_print */

/**
 * The Global object's 'eval' routine
 *
 * See also:
 *          ECMA-262 v5, 15.1.2.1
 *
 * A non-string argument is returned as is (a copy of the value is made);
 * a string argument is passed to ecma_op_eval.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_eval (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                 ecma_value_t x) /**< routine's first argument */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  const bool is_direct_eval = vm_is_direct_eval_form_call ();

  /*
   * See also: ECMA-262 v5, 10.1.1
   *
   * The strictness of the caller is queried for direct eval calls only;
   * an indirect call is always treated as called from non-strict code.
   */
  const bool is_called_from_strict_mode_code = is_direct_eval && vm_is_strict_mode ();

  if (ecma_is_value_string (x))
  {
    /* steps 2 to 8 */
    ret_value = ecma_op_eval (ecma_get_string_from_value (x),
                              is_direct_eval,
                              is_called_from_strict_mode_code);
  }
  else
  {
    /* step 1 */
    ret_value = ecma_make_normal_completion_value (ecma_copy_value (x, true));
  }

  return ret_value;
} /* ecma_builtin_global_object_eval */

/**
 * The Global object's 'parseInt' routine
 *
 * See also:
 *          ECMA-262 v5, 15.1.2.2
 *
 * The first argument is converted to a string and copied into a local utf8 buffer.
 * Leading white space and line terminators are skipped, an optional sign and (for radix 0 or 16)
 * an optional '0x' / '0X' prefix are consumed, then the longest run of characters that are valid
 * digits in the radix is accumulated, starting from the least significant digit.
 *
 * The result is NaN if the string is empty or consists of white space only, if the radix is
 * non-zero and outside of [2, 36], or if no valid digit follows the sign / prefix.
 *
 * The numbered comments in the body refer to the steps of the algorithm in the standard.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_parse_int (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                      ecma_value_t string, /**< routine's first argument */
                                      ecma_value_t radix) /**< routine's second argument */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  /* 1. */
  ECMA_TRY_CATCH (string_var, ecma_op_to_string (string), ret_value);

  ecma_string_t *number_str_p = ecma_get_string_from_value (string_var);
  lit_utf8_size_t str_size = ecma_string_get_size (number_str_p);

  if (str_size > 0)
  {
    MEM_DEFINE_LOCAL_ARRAY (utf8_string_buff, str_size, lit_utf8_byte_t);

    ssize_t bytes_copied = ecma_string_to_utf8_string (number_str_p,
                                                       utf8_string_buff,
                                                       (ssize_t) str_size);
    JERRY_ASSERT (bytes_copied >= 0);
    lit_utf8_iterator_t iter = lit_utf8_iterator_create (utf8_string_buff, str_size);

    /* 2. Remove leading whitespace. */

    /* Both positions default to the end of the string, i.e. to an empty digit sequence. */
    lit_utf8_iterator_seek_eos (&iter);

    lit_utf8_iterator_pos_t start = lit_utf8_iterator_get_pos (&iter);
    lit_utf8_iterator_pos_t end = lit_utf8_iterator_get_pos (&iter);

    lit_utf8_iterator_seek_bos (&iter);

    while (!lit_utf8_iterator_is_eos (&iter))
    {
      ecma_char_t current_char = lit_utf8_iterator_read_next (&iter);

      if (!lit_char_is_white_space (current_char)
          && !lit_char_is_line_terminator (current_char))
      {
        /* Step back, so the iterator points to the first significant character. */
        lit_utf8_iterator_read_prev (&iter);
        start = lit_utf8_iterator_get_pos (&iter);
        break;
      }
    }

    /* 3. */
    int sign = 1;

    /* 4. */

    /*
     * If the string consists of white space only, the iterator is already at the end of
     * the buffer and nothing must be read. In that case 'current' keeps a value that is
     * neither a sign nor a digit, and the empty digit sequence yields NaN in step 12.
     */
    ecma_char_t current = LIT_CHAR_NULL;
    if (!lit_utf8_iterator_is_eos (&iter))
    {
      current = lit_utf8_iterator_read_next (&iter);
    }

    if (current == LIT_CHAR_MINUS)
    {
      sign = -1;
    }

    /* 5. */
    if (current == LIT_CHAR_MINUS || current == LIT_CHAR_PLUS)
    {
      /* The digit sequence starts after the sign character. */
      start = lit_utf8_iterator_get_pos (&iter);
      if (!lit_utf8_iterator_is_eos (&iter))
      {
        current = lit_utf8_iterator_read_next (&iter);
      }
    }

    /* 6. */
    ECMA_OP_TO_NUMBER_TRY_CATCH (radix_num, radix, ret_value);
    int32_t rad = ecma_number_to_int32 (radix_num);

    /* 7.*/
    bool strip_prefix = true;

    /* 8. */
    if (rad != 0)
    {
      /* 8.a */
      if (rad < 2 || rad > 36)
      {
        ecma_number_t *ret_num_p = ecma_alloc_number ();
        *ret_num_p = ecma_number_make_nan ();
        ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
      }
      /* 8.b */
      else if (rad != 16)
      {
        strip_prefix = false;
      }
    }
    /* 9. */
    else
    {
      rad = 10;
    }

    if (ecma_is_completion_value_empty (ret_value))
    {
      /* 10. */
      if (strip_prefix)
      {
        /* At this point 'current' is the first character after the optional sign. */
        if (end.offset - start.offset >= 2 && current == LIT_CHAR_0)
        {
          ecma_char_t next = lit_utf8_iterator_peek_next (&iter);
          if (next == LIT_CHAR_LOWERCASE_X || next == LIT_CHAR_UPPERCASE_X)
          {
            /* Skip the 'x' or 'X' characters. */
            lit_utf8_iterator_incr (&iter);
            start = lit_utf8_iterator_get_pos (&iter);

            rad = 16;
          }
        }
      }

      /* 11. Check if characters are in [0, Radix - 1]. We also convert them to number values in the process. */
      lit_utf8_iterator_seek (&iter, start);
      while (!lit_utf8_iterator_is_eos (&iter))
      {
        ecma_char_t current_char = lit_utf8_iterator_read_next (&iter);
        int32_t current_number;

        if ((current_char >= LIT_CHAR_LOWERCASE_A && current_char <= LIT_CHAR_LOWERCASE_Z))
        {
          current_number = current_char - LIT_CHAR_LOWERCASE_A + 10;
        }
        else if ((current_char >= LIT_CHAR_UPPERCASE_A && current_char <= LIT_CHAR_UPPERCASE_Z))
        {
          current_number = current_char - LIT_CHAR_UPPERCASE_A + 10;
        }
        else if (lit_char_is_decimal_digit (current_char))
        {
          current_number = current_char - LIT_CHAR_0;
        }
        else
        {
          /* Not a valid number char, set value to radix so it fails to pass as a valid character. */
          current_number = rad;
        }

        if (!(current_number < rad))
        {
          /* The digit sequence ends before the first character that is not a digit of the radix. */
          lit_utf8_iterator_decr (&iter);
          end = lit_utf8_iterator_get_pos (&iter);
          break;
        }
      }

      /* 12. */
      if (end.offset - start.offset == 0)
      {
        ecma_number_t *ret_num_p = ecma_alloc_number ();
        *ret_num_p = ecma_number_make_nan ();
        ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
      }
    }

    if (ecma_is_completion_value_empty (ret_value))
    {
      ecma_number_t *value_p = ecma_alloc_number ();
      *value_p = 0;
      ecma_number_t multiplier = 1.0f;

      /* 13. and 14. */

      /* The digits are processed backwards, from the least significant to the most significant one. */
      lit_utf8_iterator_seek (&iter, end);
      while (lit_utf8_iterator_get_pos (&iter).offset > start.offset)
      {
        ecma_char_t current_char = lit_utf8_iterator_read_prev (&iter);
        ecma_number_t current_number;

        if ((current_char >= LIT_CHAR_LOWERCASE_A && current_char <= LIT_CHAR_LOWERCASE_Z))
        {
          current_number =  (ecma_number_t) current_char - LIT_CHAR_LOWERCASE_A + 10;
        }
        else if ((current_char >= LIT_CHAR_UPPERCASE_A && current_char <= LIT_CHAR_UPPERCASE_Z))
        {
          current_number =  (ecma_number_t) current_char - LIT_CHAR_UPPERCASE_A + 10;
        }
        else if (lit_char_is_decimal_digit (current_char))
        {
          current_number =  (ecma_number_t) current_char - LIT_CHAR_0;
        }
        else
        {
          /* Every character of [start, end) has been validated in step 11. */
          JERRY_UNREACHABLE ();
        }

        *value_p += current_number * multiplier;
        multiplier *= (ecma_number_t) rad;
      }

      /* 15. */
      if (sign < 0)
      {
        *value_p *= (ecma_number_t) sign;
      }

      ret_value = ecma_make_normal_completion_value (ecma_make_number_value (value_p));
    }

    ECMA_OP_TO_NUMBER_FINALIZE (radix_num);
    MEM_FINALIZE_LOCAL_ARRAY (utf8_string_buff);
  }
  else
  {
    /* Empty string. */
    ecma_number_t *ret_num_p = ecma_alloc_number ();
    *ret_num_p = ecma_number_make_nan ();
    ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
  }

  ECMA_FINALIZE (string_var);
  return ret_value;
} /* ecma_builtin_global_object_parse_int */

/**
 * The Global object's 'parseFloat' routine
 *
 * See also:
 *          ECMA-262 v5, 15.1.2.3
 *
 * The argument is converted to a string and copied into a local utf8 buffer. Leading white space
 * and line terminators are skipped and an optional sign is consumed. The remaining text is first
 * compared against "Infinity"; otherwise the longest prefix consisting of a whole part, a fraction
 * part and an exponent part is located and converted with ecma_utf8_string_to_number.
 *
 * The result is NaN if the string is empty, ends after the white space / sign,
 * or does not start with a valid number.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_parse_float (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                        ecma_value_t string) /**< routine's first argument */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  /* 1. */
  ECMA_TRY_CATCH (string_var, ecma_op_to_string (string), ret_value);

  ecma_string_t *number_str_p = ecma_get_string_from_value (string_var);
  lit_utf8_size_t str_size = ecma_string_get_size (number_str_p);

  if (str_size > 0)
  {
    MEM_DEFINE_LOCAL_ARRAY (utf8_string_buff, str_size, lit_utf8_byte_t);

    ssize_t bytes_copied = ecma_string_to_utf8_string (number_str_p,
                                                       utf8_string_buff,
                                                       (ssize_t) str_size);
    JERRY_ASSERT (bytes_copied >= 0);
    lit_utf8_iterator_t iter = lit_utf8_iterator_create (utf8_string_buff, str_size);

    /* Both positions default to the end of the string, i.e. to an empty number literal. */
    lit_utf8_iterator_seek_eos (&iter);

    lit_utf8_iterator_pos_t start = lit_utf8_iterator_get_pos (&iter);
    lit_utf8_iterator_pos_t end = lit_utf8_iterator_get_pos (&iter);

    lit_utf8_iterator_seek_bos (&iter);


    /* 2. Find first non whitespace char and set starting position. */
    while (!lit_utf8_iterator_is_eos (&iter))
    {
      ecma_char_t current_char = lit_utf8_iterator_read_next (&iter);

      if (!lit_char_is_white_space (current_char)
          && !lit_char_is_line_terminator (current_char))
      {
        lit_utf8_iterator_decr (&iter);
        start = lit_utf8_iterator_get_pos (&iter);
        break;
      }
    }

    /* True if the number is negative. */
    bool sign = false;
    ecma_char_t current;

    if (!lit_utf8_iterator_is_eos (&iter))
    {
      /* Check if sign is present. */
      current = lit_utf8_iterator_read_next (&iter);
      if (current == LIT_CHAR_MINUS)
      {
        sign = true;
      }

      if (current == LIT_CHAR_MINUS || current == LIT_CHAR_PLUS)
      {
        /* Set starting position to be after the sign character. */
        start = lit_utf8_iterator_get_pos (&iter);
      }
      else
      {
        lit_utf8_iterator_decr (&iter);
      }
    }

    ecma_number_t *ret_num_p = ecma_alloc_number ();

    /*
     * The iterator has to cover the whole "Infinity" literal (terminating NUL excluded).
     * If it covered the first byte only, every string starting with 'I' would be
     * reported as Infinity.
     */
    static const lit_utf8_byte_t infinity_utf8_str[] = "Infinity";
    lit_utf8_iterator_t infinity_iter = lit_utf8_iterator_create (infinity_utf8_str,
                                                                  (lit_utf8_size_t) (sizeof (infinity_utf8_str) - 1));

    JERRY_ASSERT (!lit_utf8_iterator_is_eos (&infinity_iter));

    /* Check if string is equal to "Infinity". */
    while (!lit_utf8_iterator_is_eos (&iter)
           && (lit_utf8_iterator_read_next (&iter) == lit_utf8_iterator_read_next (&infinity_iter)))
    {
      if (lit_utf8_iterator_is_eos (&infinity_iter))
      {
        /* String matched Infinity. */
        *ret_num_p = ecma_number_make_infinity (sign);
        ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
        break;
      }
    }

    /* Reset to starting position. */
    lit_utf8_iterator_seek (&iter, start);

    if (ecma_is_completion_value_empty (ret_value) && !lit_utf8_iterator_is_eos (&iter))
    {
      current = lit_utf8_iterator_read_next (&iter);

      bool has_whole_part = false;
      bool has_fraction_part = false;

      /* Check digits of whole part. */
      if (lit_char_is_decimal_digit (current))
      {
        has_whole_part = true;

        while (!lit_utf8_iterator_is_eos (&iter))
        {
          current = lit_utf8_iterator_read_next (&iter);
          if (!lit_char_is_decimal_digit (current))
          {
            lit_utf8_iterator_decr (&iter);
            break;
          }
        }
      }
      else
      {
        lit_utf8_iterator_decr (&iter);
      }

      /* Set end position to the end of whole part. */
      end = lit_utf8_iterator_get_pos (&iter);
      if (!lit_utf8_iterator_is_eos (&iter))
      {
        current = lit_utf8_iterator_read_next (&iter);
      }

      /* Check decimal point. */
      if (current == LIT_CHAR_DOT && !lit_utf8_iterator_is_eos (&iter))
      {
        current = lit_utf8_iterator_read_next (&iter);

        if (lit_char_is_decimal_digit (current))
        {
          has_fraction_part = true;

          /* Check digits of fractional part. */
          while (!lit_utf8_iterator_is_eos (&iter))
          {
            current = lit_utf8_iterator_read_next (&iter);
            if (!lit_char_is_decimal_digit (current))
            {
              lit_utf8_iterator_decr (&iter);
              break;
            }
          }

          /* Set end position to end of fraction part. */
          end = lit_utf8_iterator_get_pos (&iter);
        }
        else
        {
          lit_utf8_iterator_decr (&iter);
        }
      }
      else
      {
        lit_utf8_iterator_decr (&iter);
      }

      if (!lit_utf8_iterator_is_eos (&iter))
      {
        current = lit_utf8_iterator_read_next (&iter);
      }

      /* Check exponent. */
      if ((current == LIT_CHAR_LOWERCASE_E || current == LIT_CHAR_UPPERCASE_E)
          && (has_whole_part || has_fraction_part)
          && !lit_utf8_iterator_is_eos (&iter))
      {
        current = lit_utf8_iterator_read_next (&iter);

        /* Check sign of exponent. */
        if ((current == LIT_CHAR_PLUS || current == LIT_CHAR_MINUS)
             && !lit_utf8_iterator_is_eos (&iter))
        {
          current = lit_utf8_iterator_read_next (&iter);
        }

        if (lit_char_is_decimal_digit (current))
        {
          /* Check digits of exponent part. */
          while (!lit_utf8_iterator_is_eos (&iter))
          {
            current = lit_utf8_iterator_read_next (&iter);
            if (!lit_char_is_decimal_digit (current))
            {
              lit_utf8_iterator_decr (&iter);
              break;
            }
          }

          /* Set end position to end of exponent part. */
          end = lit_utf8_iterator_get_pos (&iter);
        }
      }
      else
      {
        lit_utf8_iterator_decr (&iter);
      }

      /* String did not contain a valid number. */
      if (start.offset == end.offset)
      {
        *ret_num_p = ecma_number_make_nan ();
        ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
      }
      else
      {
        /* 5. */
        *ret_num_p = ecma_utf8_string_to_number (utf8_string_buff + start.offset,
                                                 (lit_utf8_size_t) (end.offset - start.offset));

        /* The sign character is not part of the [start, end) range, so it is applied here. */
        if (sign)
        {
          *ret_num_p *= -1;
        }

        ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
      }
    }
    /* String ended after sign character, or was empty after removing leading whitespace. */
    else if (ecma_is_completion_value_empty (ret_value))
    {
      *ret_num_p = ecma_number_make_nan ();
      ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
    }
    MEM_FINALIZE_LOCAL_ARRAY (utf8_string_buff);
  }
  /* String length is zero. */
  else
  {
    ecma_number_t *ret_num_p = ecma_alloc_number ();
    *ret_num_p = ecma_number_make_nan ();
    ret_value = ecma_make_normal_completion_value (ecma_make_number_value (ret_num_p));
  }

  ECMA_FINALIZE (string_var);

  return ret_value;
} /* ecma_builtin_global_object_parse_float */

/**
 * The Global object's 'isNaN' routine
 *
 * See also:
 *          ECMA-262 v5, 15.1.2.4
 *
 * The argument is converted to a number; the result is true if that number is NaN, false otherwise.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_is_nan (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                   ecma_value_t arg) /**< routine's first argument */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  ECMA_OP_TO_NUMBER_TRY_CATCH (arg_num, arg, ret_value);

  if (ecma_number_is_nan (arg_num))
  {
    ret_value = ecma_make_simple_completion_value (ECMA_SIMPLE_VALUE_TRUE);
  }
  else
  {
    ret_value = ecma_make_simple_completion_value (ECMA_SIMPLE_VALUE_FALSE);
  }

  ECMA_OP_TO_NUMBER_FINALIZE (arg_num);

  return ret_value;
} /* ecma_builtin_global_object_is_nan */

/**
 * The Global object's 'isFinite' routine
 *
 * See also:
 *          ECMA-262 v5, 15.1.2.5
 *
 * The argument is converted to a number; the result is false if that number is NaN
 * or an infinity, true otherwise.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_is_finite (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                      ecma_value_t arg) /**< routine's first argument */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  ECMA_OP_TO_NUMBER_TRY_CATCH (arg_num, arg, ret_value);

  if (!ecma_number_is_nan (arg_num) && !ecma_number_is_infinity (arg_num))
  {
    ret_value = ecma_make_simple_completion_value (ECMA_SIMPLE_VALUE_TRUE);
  }
  else
  {
    ret_value = ecma_make_simple_completion_value (ECMA_SIMPLE_VALUE_FALSE);
  }

  ECMA_OP_TO_NUMBER_FINALIZE (arg_num);

  return ret_value;
} /* ecma_builtin_global_object_is_finite */

/**
 * Helper function to check whether a character is in a character bitset.
 *
 * The bitset holds one bit per character: the bit of a character is stored in the byte with
 * index (character / 8), at the bit position (character % 8) counted from the least significant bit.
 *
 * @return true if the character is in the character bitset.
 */
static bool
ecma_builtin_global_object_character_is_in (uint32_t character, /**< character */
                                            uint8_t *bitset) /**< character set */
{
  JERRY_ASSERT (character < 128);

  const uint32_t byte_index = character >> 3;
  const uint32_t bit_index = character & 0x7;

  return ((bitset[byte_index] >> bit_index) & 1) != 0;
} /* ecma_builtin_global_object_character_is_in */

/*
 * Unescaped URI characters bitset:
 *   One bit for each character between 0 - 127.
 *   Bit is set if the character is in the unescaped URI set.
 *
 *   The bit of character c is bit (c & 0x7) of byte (c >> 3),
 *   counted from the least significant bit.
 *
 *   The set bits correspond to the ASCII letters, the decimal digits and
 *   the following characters: ! # $ & ' ( ) * + , - . / : ; = ? @ _ ~
 */
static uint8_t unescaped_uri_set[16] =
{
  0x0, 0x0, 0x0, 0x0, 0xda, 0xff, 0xff, 0xaf,
  0xff, 0xff, 0xff, 0x87, 0xfe, 0xff, 0xff, 0x47
};

/*
 * Unescaped URI component characters bitset:
 *   One bit for each character between 0 - 127.
 *   Bit is set if the character is in the unescaped component URI set.
 *
 *   The bit of character c is bit (c & 0x7) of byte (c >> 3),
 *   counted from the least significant bit.
 *
 *   The set bits correspond to the ASCII letters, the decimal digits and
 *   the following characters: ! ' ( ) * - . _ ~
 */
static uint8_t unescaped_uri_component_set[16] =
{
  0x0, 0x0, 0x0, 0x0, 0x82, 0x67, 0xff, 0x3,
  0xfe, 0xff, 0xff, 0x87, 0xfe, 0xff, 0xff, 0x47
};

/*
 * Size of an encoded byte in the URI:
 * the format is a percent sign followed by two hex digits.
 */
#define URI_ENCODED_BYTE_SIZE (3)

/*
 * These two values indicate whether a byte of the decoded output
 * was present in the original stream or was decoded from a %xx sequence.
 */
#define URI_DECODE_ORIGINAL_BYTE 0
#define URI_DECODE_DECODED_BYTE 1

/**
 * Helper function to decode URI.
 *
 * The argument is converted to a string and processed in two passes over its utf8 bytes:
 * the first pass validates the %xx sequences and computes the size of the output,
 * the second pass produces the output bytes. The output is then checked to be a valid utf8 string
 * that has no surrogate produced from %xx sequences outside of a decoded high/low surrogate pair.
 *
 * A %xx sequence is kept in its encoded form if the decoded byte is a one-byte code point that is
 * in reserved_uri_bitset, but not in unescaped_uri_component_set.
 *
 * An URI error is thrown if a '%' is not followed by two hex digits, or if the output fails
 * the validity checks described above.
 *
 * NOTE(review): 'uri' is marked with __attr_unused___, although it is read by the function.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_decode_uri_helper (ecma_value_t uri __attr_unused___, /**< uri argument */
                                              uint8_t *reserved_uri_bitset) /**< reserved characters bitset */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  ECMA_TRY_CATCH (string,
                  ecma_op_to_string (uri),
                  ret_value);

  JERRY_ASSERT (ecma_is_value_string (string));

  ecma_string_t *input_string_p = ecma_get_string_from_value (string);
  lit_utf8_size_t input_size = ecma_string_get_size (input_string_p);

  /* One extra byte is allocated for the terminating zero byte appended below. */
  MEM_DEFINE_LOCAL_ARRAY (input_start_p,
                          input_size + 1,
                          lit_utf8_byte_t);

  ecma_string_to_utf8_string (input_string_p,
                              input_start_p,
                              (ssize_t) (input_size));
  /*
   * Presumably the terminator makes the hex digit reading fail for a '%' that is
   * too close to the end of the input - TODO confirm against lit_read_code_point_from_hex.
   */
  input_start_p[input_size] = LIT_BYTE_NULL;

  lit_utf8_byte_t *input_char_p = input_start_p;
  lit_utf8_byte_t *input_end_p = input_start_p + input_size;
  lit_utf8_size_t output_size = 0;

  /*
   * The URI decoding has two major phases: first we validate the input,
   * and compute the length of the output, then we decode the input.
   */

  while (input_char_p < input_end_p)
  {
    /*
     * We expect that the input is a valid UTF-8 sequence,
     * so characters >= 0x80 can be let through.
     */

    if (*input_char_p != '%')
    {
      /* Bytes outside of %xx sequences are copied to the output unchanged. */
      output_size++;
      input_char_p++;
      continue;
    }

    lit_code_point_t decoded_byte;

    if (!lit_read_code_point_from_hex (input_char_p + 1, 2, &decoded_byte))
    {
      /* The '%' is not followed by two hex digits. */
      ret_value = ecma_make_throw_obj_completion_value (ecma_new_standard_error (ECMA_ERROR_URI));
      break;
    }

    input_char_p += URI_ENCODED_BYTE_SIZE;

    if (decoded_byte <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
    {
      /*
       * We don't decode those bytes, which are part of reserved_uri_bitset
       * but not part of unescaped_uri_component_set.
       */
      if (ecma_builtin_global_object_character_is_in (decoded_byte, reserved_uri_bitset)
          && !ecma_builtin_global_object_character_is_in (decoded_byte, unescaped_uri_component_set))
      {
        /* The whole %xx sequence is kept in the output. */
        output_size += URI_ENCODED_BYTE_SIZE;
      }
      else
      {
        output_size++;
      }
    }
    else
    {
      /* A decoded byte >= 0x80 occupies a single byte of the output. */
      output_size++;
    }
  }

  if (ecma_is_completion_value_empty (ret_value))
  {
    /*
     * The buffer consists of two parts of output_size bytes each: the first part receives
     * the output bytes, the second part stores the type of the corresponding output byte
     * (URI_DECODE_ORIGINAL_BYTE or URI_DECODE_DECODED_BYTE).
     */
    MEM_DEFINE_LOCAL_ARRAY (output_start_p,
                            output_size * 2,
                            lit_utf8_byte_t);

    input_char_p = input_start_p;
    lit_utf8_byte_t *output_char_p = output_start_p;
    lit_utf8_byte_t *output_type_p = output_start_p + output_size;

    while (input_char_p < input_end_p)
    {
      /* Input decode. */
      if (*input_char_p != '%')
      {
        *output_type_p++ = URI_DECODE_ORIGINAL_BYTE;
        *output_char_p = *input_char_p;
        output_char_p++;
        input_char_p++;
        continue;
      }

      *output_type_p++ = URI_DECODE_DECODED_BYTE;

      lit_code_point_t decoded_byte;

      /* The return value is not checked here: the sequence has been validated by the first pass. */
      lit_read_code_point_from_hex (input_char_p + 1, 2, &decoded_byte);
      input_char_p += URI_ENCODED_BYTE_SIZE;

      if (decoded_byte <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
      {
        if (ecma_builtin_global_object_character_is_in (decoded_byte, reserved_uri_bitset)
            && !ecma_builtin_global_object_character_is_in (decoded_byte, unescaped_uri_component_set))
        {
          /*
           * The sequence is kept encoded: only the '%' is written here, and the input pointer
           * is moved back to the two hex digits, so the following iterations copy them
           * to the output as original bytes.
           */
          *output_char_p = '%';
          output_char_p++;
          input_char_p -= 2;
        }
        else
        {
          *output_char_p = (lit_utf8_byte_t) decoded_byte;
          output_char_p++;
        }
      }
      else
      {
        *output_char_p = (lit_utf8_byte_t) decoded_byte;
        output_char_p++;
      }
    }

    /* The second pass must produce exactly as many bytes as computed by the first pass. */
    JERRY_ASSERT (output_start_p + output_size == output_char_p);

    bool valid_utf8 = lit_is_utf8_string_valid (output_start_p, output_size);

    if (valid_utf8)
    {
      lit_utf8_iterator_t characters = lit_utf8_iterator_create (output_start_p, output_size);
      output_type_p = output_start_p + output_size;

      while (!lit_utf8_iterator_is_eos (&characters))
      {
        /* The type of a character is the type of its first byte. */
        bool original_byte = output_type_p[characters.buf_pos.offset] == URI_DECODE_ORIGINAL_BYTE;

        ecma_char_t character = lit_utf8_iterator_read_next (&characters);

        /* Surrogate fragments are allowed in JS, but not accepted by URI decoding. */
        if (!original_byte)
        {
          if (lit_is_code_unit_high_surrogate (character))
          {
            /* Note: stray high/low surrogate pairs are not allowed in the stream. */
            if (lit_utf8_iterator_is_eos (&characters))
            {
              valid_utf8 = false;
              break;
            }

            /* A decoded high surrogate must be followed by a decoded low surrogate. */
            if (output_type_p[characters.buf_pos.offset] == URI_DECODE_ORIGINAL_BYTE
                || !lit_is_code_unit_low_surrogate (lit_utf8_iterator_read_next (&characters)))
            {
              valid_utf8 = false;
              break;
            }
          }
          else if (lit_is_code_unit_low_surrogate (character))
          {
            /* A decoded low surrogate without a preceding decoded high surrogate. */
            valid_utf8 = false;
            break;
          }
        }
      }
    }

    if (valid_utf8)
    {
      ecma_string_t *output_string_p = ecma_new_ecma_string_from_utf8 (output_start_p, output_size);
      ret_value = ecma_make_normal_completion_value (ecma_make_string_value (output_string_p));
    }
    else
    {
      ret_value = ecma_make_throw_obj_completion_value (ecma_new_standard_error (ECMA_ERROR_URI));
    }

    MEM_FINALIZE_LOCAL_ARRAY (output_start_p);
  }

  MEM_FINALIZE_LOCAL_ARRAY (input_start_p);

  ECMA_FINALIZE (string);
  return ret_value;
} /* ecma_builtin_global_object_decode_uri_helper */

/**
 * The Global object's 'decodeURI' routine
 *
 * See also:
 *          ECMA-262 v5, 15.1.3.1
 *
 * The decoding is delegated to the URI decoding helper; the unescaped URI characters bitset
 * is passed to it as the reserved characters bitset.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_decode_uri (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                       ecma_value_t encoded_uri) /**< routine's first argument */
{
  uint8_t *reserved_bitset_p = unescaped_uri_set;

  return ecma_builtin_global_object_decode_uri_helper (encoded_uri, reserved_bitset_p);
} /* ecma_builtin_global_object_decode_uri */

/**
 * The Global object's 'decodeURIComponent' routine
 *
 * See also:
 *          ECMA-262 v5, 15.1.3.2
 *
 * The decoding is delegated to the URI decoding helper; the unescaped URI component characters
 * bitset is passed to it as the reserved characters bitset.
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_decode_uri_component (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                                 ecma_value_t encoded_uri_component) /**< routine's
                                                                                      *   first argument */
{
  uint8_t *reserved_bitset_p = unescaped_uri_component_set;

  return ecma_builtin_global_object_decode_uri_helper (encoded_uri_component, reserved_bitset_p);
} /* ecma_builtin_global_object_decode_uri_component */

/**
 * Helper function to encode byte as hexadecimal values.
 *
 * Three bytes are written to the destination: a percent sign, followed by the upper
 * and the lower four bits of the value as hexadecimal digits ('0'-'9', 'A'-'F').
 */
static void
ecma_builtin_global_object_byte_to_hex (lit_utf8_byte_t *dest_p, /**< destination pointer */
                                        uint32_t byte) /**< value */
{
  JERRY_ASSERT (byte < 256);

  /* The upper four bits are emitted first. */
  const ecma_char_t nibbles[2] =
  {
    (ecma_char_t) (byte >> 4),
    (ecma_char_t) (byte & 0xf)
  };

  dest_p[0] = '%';

  for (uint32_t nibble_index = 0; nibble_index < 2; nibble_index++)
  {
    const ecma_char_t nibble = nibbles[nibble_index];

    if (nibble > 9)
    {
      dest_p[nibble_index + 1] = (lit_utf8_byte_t) (nibble + ('A' - 10));
    }
    else
    {
      dest_p[nibble_index + 1] = (lit_utf8_byte_t) (nibble + '0');
    }
  }
} /* ecma_builtin_global_object_byte_to_hex */

/**
 * Helper function to encode URI.
 *
 * The argument is converted to a string and its UTF-8 bytes are processed one by one:
 *  - a single-byte code point that is a member of 'unescaped_uri_bitset' is copied unchanged;
 *  - every other byte (including each byte of a multi-byte sequence) is replaced
 *    by the escape produced by ecma_builtin_global_object_byte_to_hex ('%' and two hex digits).
 *
 * A URIError is thrown if the input contains a three-byte sequence that encodes
 * a code point in the surrogate range; in that case no output string is created.
 * An exception thrown by the string conversion of the argument is expected to be
 * propagated through ECMA_TRY_CATCH (macro defined outside of this chunk).
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_encode_uri_helper (ecma_value_t uri, /**< uri argument */
                                              uint8_t* unescaped_uri_bitset) /**< unescaped bitset */
{
  ecma_completion_value_t ret_value = ecma_make_empty_completion_value ();

  /*
   * NOTE(review): ECMA_TRY_CATCH / ECMA_FINALIZE and MEM_DEFINE_LOCAL_ARRAY / MEM_FINALIZE_LOCAL_ARRAY
   * are paired macros defined elsewhere; they appear to open and close scopes, so the
   * finalizers below must stay in reverse order of the definitions - confirm before reordering.
   */
  ECMA_TRY_CATCH (string,
                  ecma_op_to_string (uri),
                  ret_value);

  JERRY_ASSERT (ecma_is_value_string (string));

  ecma_string_t *input_string_p = ecma_get_string_from_value (string);
  lit_utf8_size_t input_size = ecma_string_get_size (input_string_p);

  /* Temporary buffer holding the UTF-8 bytes of the input string. */
  MEM_DEFINE_LOCAL_ARRAY (input_start_p,
                          input_size,
                          lit_utf8_byte_t);

  ecma_string_to_utf8_string (input_string_p,
                              input_start_p,
                              (ssize_t) (input_size));

  /*
   * The URI encoding has two major phases: first we validate the input,
   * and compute the length of the output, then we encode the input.
   */

  lit_utf8_byte_t *input_char_p = input_start_p;
  lit_utf8_byte_t *input_end_p = input_start_p + input_size;
  lit_utf8_size_t output_length = 0;

  while (input_char_p < input_end_p)
  {
    /*
     * We expect that the input is a valid UTF-8 sequence,
     * so we only need to reject stray surrogates
     * (surrogate code points encoded as three-byte sequences).
     */

    /* Input validation. */
    if (*input_char_p <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
    {
      /* Single-byte code point: copied as is if it is in the unescaped set, escaped otherwise. */
      if (ecma_builtin_global_object_character_is_in (*input_char_p, unescaped_uri_bitset))
      {
        output_length++;
      }
      else
      {
        output_length += URI_ENCODED_BYTE_SIZE;
      }
    }
    else if (*input_char_p == (LIT_UTF8_3_BYTE_MARKER + (LIT_UTF16_HIGH_SURROGATE_MARKER >> 12)))
    {
      /* The next character is in the [0xd000, 0xdfff] range. */
      output_length += URI_ENCODED_BYTE_SIZE;
      /* Step to the second byte of the sequence; it decides whether this is a surrogate. */
      input_char_p++;
      JERRY_ASSERT (input_char_p < input_end_p);
      JERRY_ASSERT ((*input_char_p & LIT_UTF8_EXTRA_BYTE_MASK) == LIT_UTF8_EXTRA_BYTE_MARKER);

      /* If this condition is true, the next character is >= LIT_UTF16_HIGH_SURROGATE_MIN. */
      if (*input_char_p & 0x20)
      {
        /* Leaving the loop with a throw completion makes the encoding phase below be skipped. */
        ret_value = ecma_make_throw_obj_completion_value (ecma_new_standard_error (ECMA_ERROR_URI));
        break;
      }
      /* Account for the second byte; the remaining byte is counted by a later iteration. */
      output_length += URI_ENCODED_BYTE_SIZE;
    }
    else
    {
      /* Any other byte of a multi-byte sequence is always escaped. */
      output_length += URI_ENCODED_BYTE_SIZE;
    }

    input_char_p++;
  }

  if (ecma_is_completion_value_empty (ret_value))
  {
    /* Validation succeeded: allocate the output buffer with the exact length computed above. */
    MEM_DEFINE_LOCAL_ARRAY (output_start_p,
                            output_length,
                            lit_utf8_byte_t);

    lit_utf8_byte_t *output_char_p = output_start_p;
    input_char_p = input_start_p;

    while (input_char_p < input_end_p)
    {
      /* Input encode. */

      if (*input_char_p <= LIT_UTF8_1_BYTE_CODE_POINT_MAX)
      {
        if (ecma_builtin_global_object_character_is_in (*input_char_p, unescaped_uri_bitset))
        {
          *output_char_p++ = *input_char_p;
        }
        else
        {
          ecma_builtin_global_object_byte_to_hex (output_char_p, *input_char_p);
          output_char_p += URI_ENCODED_BYTE_SIZE;
        }
      }
      else
      {
        /* Bytes of multi-byte sequences are escaped individually. */
        ecma_builtin_global_object_byte_to_hex (output_char_p, *input_char_p);
        output_char_p += URI_ENCODED_BYTE_SIZE;
      }

      input_char_p++;
    }

    /* Both phases must agree on the output size. */
    JERRY_ASSERT (output_start_p + output_length == output_char_p);

    ecma_string_t *output_string_p = ecma_new_ecma_string_from_utf8 (output_start_p, output_length);

    ret_value = ecma_make_normal_completion_value (ecma_make_string_value (output_string_p));

    MEM_FINALIZE_LOCAL_ARRAY (output_start_p);
  }

  MEM_FINALIZE_LOCAL_ARRAY (input_start_p);

  ECMA_FINALIZE (string);
  return ret_value;
} /* ecma_builtin_global_object_encode_uri_helper */

/**
 * The Global object's 'encodeURI' routine
 *
 * Thin wrapper: forwards its argument to ecma_builtin_global_object_encode_uri_helper
 * together with the unescaped_uri_set bitset, so characters contained in that set
 * are left unescaped.
 *
 * See also:
 *          ECMA-262 v5, 15.1.3.3
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_encode_uri (ecma_value_t this_arg __attr_unused___, /**< this argument (not used) */
                                       ecma_value_t uri) /**< routine's first argument */
{
  ecma_completion_value_t ret_value = ecma_builtin_global_object_encode_uri_helper (uri, unescaped_uri_set);

  return ret_value;
} /* ecma_builtin_global_object_encode_uri */

/**
 * The Global object's 'encodeURIComponent' routine
 *
 * Thin wrapper: forwards its argument to ecma_builtin_global_object_encode_uri_helper
 * together with the unescaped_uri_component_set bitset, so characters contained in that set
 * are left unescaped.
 *
 * See also:
 *          ECMA-262 v5, 15.1.3.4
 *
 * @return completion value
 *         Returned value must be freed with ecma_free_completion_value.
 */
static ecma_completion_value_t
ecma_builtin_global_object_encode_uri_component (ecma_value_t this_arg __attr_unused___, /**< this argument */
                                                 ecma_value_t uri_component) /**< routine's first argument */
{
  ecma_completion_value_t ret_value = ecma_builtin_global_object_encode_uri_helper (uri_component,
                                                                                    unescaped_uri_component_set);

  return ret_value;
} /* ecma_builtin_global_object_encode_uri_component */

/**
 * @}
 * @}
 * @}
 */