// scanner_8cc_source.html

// Copyright 2011 the V8 project authors. All rights reserved.

// Use of this source code is governed by a BSD-style license that can be

// found in the LICENSE file.


// Features shared by parsing and pre-parsing scanners.


#include "src/parsing/scanner.h"


#include <stdint.h>


#include <cmath>

#include <optional>


#include "src/ast/ast-value-factory.h"

#include "src/base/strings.h"

#include "src/base/vlq-base64.h"

#include "src/numbers/conversions-inl.h"

#include "src/numbers/conversions.h"

#include "src/objects/bigint.h"

#include "src/parsing/parse-info.h"

#include "src/parsing/scanner-inl.h"

#include "src/zone/zone.h"


namespace v8::internal {


// Scoped guard around one (message, location) error slot.
//
// On construction the slot's current contents are remembered and the slot is
// cleared; on destruction the remembered contents are written back. While the
// guard is alive, MoveErrorTo() can drain whatever error has been written into
// the slot into a token descriptor.
class Scanner::ErrorState {
 public:
  ErrorState(MessageTemplate* message_stack, Scanner::Location* location_stack)
      : message_stack_(message_stack),
        old_message_(*message_stack),
        location_stack_(location_stack),
        old_location_(*location_stack) {
    ClearSlot();
  }

  ~ErrorState() {
    // Put back whatever was in the slot before this guard took it over.
    *location_stack_ = old_location_;
    *message_stack_ = old_message_;
  }

  // If the slot currently holds an error, records it on |dest| as its
  // invalid-template-escape error (unless |dest| already has one, in which
  // case the earlier one is kept) and then clears the slot. Does nothing when
  // the slot is empty.
  void MoveErrorTo(TokenDesc* dest) {
    const MessageTemplate pending = *message_stack_;
    if (pending == MessageTemplate::kNone) return;

    const bool dest_has_no_error =
        dest->invalid_template_escape_message == MessageTemplate::kNone;
    if (dest_has_no_error) {
      dest->invalid_template_escape_message = pending;
      dest->invalid_template_escape_location = *location_stack_;
    }
    ClearSlot();
  }

 private:
  // Resets the guarded slot to "no error".
  void ClearSlot() {
    *message_stack_ = MessageTemplate::kNone;
    *location_stack_ = Location::invalid();
  }

  MessageTemplate* const message_stack_;
  MessageTemplate const old_message_;
  Scanner::Location* const location_stack_;
  Scanner::Location const old_location_;
};


// ----------------------------------------------------------------------------

// Scanner::BookmarkScope


// Sentinel value of bookmark_: Set() DCHECKs that bookmark_ still holds this
// value before it stores a position.
const size_t Scanner::BookmarkScope::kNoBookmark =
    std::numeric_limits<size_t>::max() - 1;
// Sentinel value of bookmark_ that Apply() writes once it has run.
const size_t Scanner::BookmarkScope::kBookmarkWasApplied =
    std::numeric_limits<size_t>::max();


// Stores |position| as the bookmark. In debug builds this checks that no
// bookmark has been stored yet (bookmark_ must still be kNoBookmark).
void Scanner::BookmarkScope::Set(size_t position) {
  DCHECK_EQ(bookmark_, kNoBookmark);
  bookmark_ = position;
}


// Applies the bookmark and marks it as consumed. If this scope recorded a
// parser error (had_parser_error_), the scanner's parser-error state is set
// again and no seek happens; otherwise the error flag is reset and the
// scanner seeks to the bookmarked position.
void Scanner::BookmarkScope::Apply() {
  DCHECK(HasBeenSet());  // Caller hasn't called SetBookmark.
  if (!had_parser_error_) {
    scanner_->reset_parser_error_flag();
    scanner_->SeekNext(bookmark_);
  } else {
    scanner_->set_parser_error();
  }
  bookmark_ = kBookmarkWasApplied;
}


// True when bookmark_ holds a real position, i.e. neither of the two
// sentinel values.
bool Scanner::BookmarkScope::HasBeenSet() const {
  const bool holds_sentinel =
      bookmark_ == kNoBookmark || bookmark_ == kBookmarkWasApplied;
  return !holds_sentinel;
}


// True once Apply() has run, i.e. bookmark_ holds the kBookmarkWasApplied
// sentinel.
bool Scanner::BookmarkScope::HasBeenApplied() const {
  return bookmark_ == kBookmarkWasApplied;
}


// ----------------------------------------------------------------------------

// Scanner


// Creates a scanner reading from |source| (must be non-null; DCHECKed) with
// the given compile |flags|. The scanner starts with no HTML comment seen and
// with an empty octal-error slot (invalid location, kNone message).
Scanner::Scanner(Utf16CharacterStream* source, UnoptimizedCompileFlags flags)
    : flags_(flags),
      source_(source),
      found_html_comment_(false),
      octal_pos_(Location::invalid()),
      octal_message_(MessageTemplate::kNone) {
  DCHECK_NOT_NULL(source);
}


// Prepares the scanner and scans the first token into the "next" slot. That
// first token is flagged as following a line terminator.
void Scanner::Initialize() {
  // Need to capture identifiers in order to recognize "get" and "set"
  // in object literals.
  Init();
  next().after_line_terminator = true;
  Scan();
}


// static


// Returns true iff |c| is the Invalid() marker. In debug builds |c| must be
// either that marker or a code point in [0, String::kMaxCodePoint].
bool Scanner::IsInvalid(base::uc32 c) {
  DCHECK(c == Invalid() || base::IsInRange(c, 0u, String::kMaxCodePoint));
  return c == Scanner::Invalid();
}


// Reads exactly |expected_length| hex digits starting at c0_ and returns
// their value. If a non-hex character is encountered first, a scanner error is
// reported (the unicode or the hex escape message, depending on |unicode|)
// and Invalid() is returned. The reported location starts two characters
// before the position at entry and spans expected_length + 2 characters.
template <bool capture_raw, bool unicode>
base::uc32 Scanner::ScanHexNumber(int expected_length) {
  DCHECK_LE(expected_length, 4);  // prevent overflow

  const int escape_start = source_pos() - 2;
  base::uc32 value = 0;
  int remaining = expected_length;
  while (remaining-- > 0) {
    const int digit = base::HexValue(c0_);
    if (digit < 0) {
      const MessageTemplate error =
          unicode ? MessageTemplate::kInvalidUnicodeEscapeSequence
                  : MessageTemplate::kInvalidHexEscapeSequence;
      ReportScannerError(
          Location(escape_start, escape_start + expected_length + 2), error);
      return Invalid();
    }
    value = value * 16 + digit;
    Advance<capture_raw>();
  }

  return value;
}


// Reads one or more hex digits starting at c0_ and returns their value.
// Returns Invalid() without reporting anything when c0_ is not a hex digit at
// entry. If the accumulated value exceeds |max_value|, reports
// kUndefinedUnicodeCodePoint for the range starting at |beg_pos| and returns
// Invalid().
template <bool capture_raw>
base::uc32 Scanner::ScanUnlimitedLengthHexNumber(base::uc32 max_value,
                                                 int beg_pos) {
  int digit = base::HexValue(c0_);
  if (digit < 0) return Invalid();

  base::uc32 value = 0;
  do {
    value = value * 16 + digit;
    if (value > max_value) {
      ReportScannerError(Location(beg_pos, source_pos() + 1),
                         MessageTemplate::kUndefinedUnicodeCodePoint);
      return Invalid();
    }
    Advance<capture_raw>();
    digit = base::HexValue(c0_);
  } while (digit >= 0);

  return value;
}


// Advances the scanner by one token: the former "next" token becomes the
// current one, and the token kind of the new current token is returned. The
// descriptor that held the old current token is recycled for lookahead.
Token::Value Scanner::Next() {
  // Rotate through tokens.
  TokenDesc* previous = current_;
  current_ = next_;
  // Either we already have the next token lined up, in which case next_next_
  // simply becomes next_. In that case we use current_ as new next_next_ and
  // clear its token to indicate that it wasn't scanned yet. Otherwise we use
  // current_ as next_ and scan into it, leaving next_next_ uninitialized.
  if (V8_LIKELY(next_next().token == Token::kUninitialized)) {
    DCHECK(next_next_next().token == Token::kUninitialized);
    next_ = previous;
    // Use 'previous' instead of 'next_' because for some reason the compiler
    // thinks 'next_' could be modified before the entry into Scan.
    previous->after_line_terminator = false;
    Scan(previous);
  } else {
    next_ = next_next_;

    // Shift the remaining lookahead down by one slot; the recycled descriptor
    // goes to the deepest slot that is now free.
    if (V8_LIKELY(next_next_next().token == Token::kUninitialized)) {
      next_next_ = previous;
    } else {
      next_next_ = next_next_next_;
      next_next_next_ = previous;
    }

    previous->token = Token::kUninitialized;
    DCHECK_NE(Token::kUninitialized, current().token);
  }
  return current().token;
}


// Returns the token after the "next" token, scanning it on demand. The
// "next" token itself is left untouched. Must not be called while the "next"
// token is kDiv or kAssignDiv (DCHECKed).
Token::Value Scanner::PeekAhead() {
  DCHECK(next().token != Token::kDiv);
  DCHECK(next().token != Token::kAssignDiv);

  if (next_next().token == Token::kUninitialized) {
    // Temporarily make the next_next_ descriptor the scan target, scan one
    // token into it, then restore the original "next" descriptor.
    TokenDesc* const saved_next = next_;
    next_ = next_next_;
    next().after_line_terminator = false;
    Scan();
    next_next_ = next_;
    next_ = saved_next;
  }
  return next_next().token;
}


// Returns the token two positions after the "next" token, scanning it on
// demand. The "next" and next_next_ descriptors are left untouched.
Token::Value Scanner::PeekAheadAhead() {
  if (next_next_next().token == Token::kUninitialized) {
    // PeekAhead() must be called first in order to call PeekAheadAhead().
    DCHECK(next_next().token != Token::kUninitialized);

    // Temporarily make the next_next_next_ descriptor the scan target, scan
    // one token into it, then restore both nearer lookahead descriptors.
    TokenDesc* const saved_next = next_;
    TokenDesc* const saved_next_next = next_next_;
    next_ = next_next_next_;
    next().after_line_terminator = false;
    Scan();
    next_next_next_ = next_;
    next_next_ = saved_next_next;
    next_ = saved_next;
  }
  return next_next_next().token;
}


// Skips an HTML-style comment as a single-line comment. When the scanner's
// flags say the source is a module, a kHtmlCommentInModule error is reported
// instead and kIllegal is returned.
Token::Value Scanner::SkipSingleHTMLComment() {
  if (!flags_.is_module()) return SkipSingleLineComment();

  ReportScannerError(source_pos(), MessageTemplate::kHtmlCommentInModule);
  return Token::kIllegal;
}


// Skips the remainder of a single-line comment and reports it as whitespace.
// Scanning stops at (and does not consume) the line terminator.
Token::Value Scanner::SkipSingleLineComment() {
  // The line terminator at the end of the line is not considered
  // to be part of the single-line comment; it is recognized
  // separately by the lexical grammar and becomes part of the
  // stream of input elements for the syntactic grammar (see
  // ECMA-262, section 7.4).
  AdvanceUntil([](base::uc32 c0) { return unibrow::IsLineTerminator(c0); });

  return Token::kWhitespace;
}


// Handles a comment that may be a magic comment ("//#" or "//@" style,
// identified by |hash_or_at_sign|). The magic-comment parser gets the first
// attempt; whatever is left of the line afterwards is skipped as an ordinary
// single-line comment. The result is always a whitespace token.
Token::Value Scanner::SkipMagicComment(base::uc32 hash_or_at_sign) {
  TryToParseMagicComment(hash_or_at_sign);

  const bool line_already_finished =
      unibrow::IsLineTerminator(c0_) || c0_ == kEndOfInput;
  return line_already_finished ? Token::kWhitespace : SkipSingleLineComment();
}


namespace {


// Decodes the value of a per-function compile hints magic comment.
//
// |data| holds a sequence of base64 VLQ encoded deltas. The first delta is
// relative to |current_position|, each following one to the previously decoded
// position. The resulting absolute positions are appended to |positions|.
//
// If any part of the data is invalid - a value fails to decode, or a decoded
// position does not fit in an int - |positions| is cleared and the function
// returns without using any of the data.
void ProcessPerFunctionCompileHints(const base::Vector<const uint8_t>& data,
                                    int current_position,
                                    std::vector<int>& positions) {
  // Compile hints are relative to the position of the comment end.
  // The deltas come straight from script text, so accumulate in 64 bits: summing
  // them in an int could overflow, which is undefined behavior.
  int64_t last_position = current_position;
  size_t pos = 0;
  const size_t length = static_cast<size_t>(data.length());
  const char* char_data = reinterpret_cast<const char*>(data.data());
  while (pos < length) {
    int32_t delta = base::VLQBase64Decode(char_data, length, &pos);
    if (delta == std::numeric_limits<int32_t>::min()) {
      // Invalid data, bail out and clear the data we read so far. (Not using
      // the data until the invalid portion is consistent with 2-byte data not
      // being handled at all.)
      positions.clear();
      return;
    }
    last_position += delta;
    if (last_position < std::numeric_limits<int>::min() ||
        last_position > std::numeric_limits<int>::max()) {
      // A position that cannot be represented as an int is treated like any
      // other invalid data.
      positions.clear();
      return;
    }
    positions.push_back(static_cast<int>(last_position));
  }
  positions.shrink_to_fit();
}


}  // namespace


// Tries to parse the magic comment that starts at the current position.
// |hash_or_at_sign| is the character ('#' or '@') that introduced it.
//
// Recognized names:
//   sourceURL                 -> value stored in source_url_
//   sourceMappingURL          -> value stored in source_mapping_url_; also
//                                records whether '@' was used
//   allFunctionsCalledOnLoad  -> ('#' only, no '=', and only while
//                                saw_non_comment_ is false) sets
//                                saw_magic_comment_compile_hints_all_
//   functionsCalledOnLoad     -> ('#' only) value is decoded into
//                                per_function_compile_hint_positions_
//
// Anything that does not match simply makes the function return; no error is
// reported.
void Scanner::TryToParseMagicComment(base::uc32 hash_or_at_sign) {
  // Magic comments are of the form: //[#@]\s<name>=\s*<value>\s*.* and this
  // function will just return if it cannot parse a magic comment.
  DCHECK(!IsWhiteSpaceOrLineTerminator(kEndOfInput));
  if (!IsWhiteSpace(c0_)) return;
  Advance();
  LiteralBuffer name;
  name.Start();

  while (c0_ != kEndOfInput && !IsWhiteSpaceOrLineTerminator(c0_) &&
         c0_ != '=') {
    name.AddChar(c0_);
    Advance();
  }
  if (!name.is_one_byte()) return;
  base::Vector<const uint8_t> name_literal = name.one_byte_literal();
  // Destination for the comment's value. Initialized so that no branch below
  // can leave it indeterminate.
  LiteralBuffer* value = nullptr;
  LiteralBuffer per_function_compile_hints_value;
  if (name_literal == base::StaticOneByteVector("sourceURL")) {
    value = &source_url_;
  } else if (name_literal == base::StaticOneByteVector("sourceMappingURL")) {
    value = &source_mapping_url_;
    DCHECK(hash_or_at_sign == '#' || hash_or_at_sign == '@');
    saw_source_mapping_url_magic_comment_at_sign_ = hash_or_at_sign == '@';
  } else if (!saw_non_comment_ &&
             name_literal ==
                 base::StaticOneByteVector("allFunctionsCalledOnLoad") &&
             hash_or_at_sign == '#' && c0_ != '=') {
    // This comment carries no value, so there is nothing more to parse.
    saw_magic_comment_compile_hints_all_ = true;
    return;
  } else if (name_literal ==
                 base::StaticOneByteVector("functionsCalledOnLoad") &&
             hash_or_at_sign == '#') {
    value = &per_function_compile_hints_value;
  } else {
    return;
  }
  if (c0_ != '=') return;
  DCHECK_NOT_NULL(value);
  value->Start();
  Advance();
  while (IsWhiteSpace(c0_)) {
    Advance();
  }
  // The value runs up to the first whitespace, line terminator or end of
  // input.
  while (c0_ != kEndOfInput && !unibrow::IsLineTerminator(c0_)) {
    if (IsWhiteSpace(c0_)) {
      break;
    }
    value->AddChar(c0_);
    Advance();
  }
  // Allow whitespace at the end.
  while (c0_ != kEndOfInput && !unibrow::IsLineTerminator(c0_)) {
    if (!IsWhiteSpace(c0_)) {
      // Something other than whitespace follows the value: discard the value
      // collected so far by restarting the buffer.
      value->Start();
      break;
    }
    Advance();
  }
  if (value == &per_function_compile_hints_value &&
      per_function_compile_hints_value.is_one_byte()) {
    base::Vector<const uint8_t> value_literal =
        per_function_compile_hints_value.one_byte_literal();
    // A new comment replaces any previously decoded hints.
    per_function_compile_hint_positions_.clear();
    per_function_compile_hint_positions_idx_ = 0;
    ProcessPerFunctionCompileHints(value_literal, source_pos(),
                                   per_function_compile_hint_positions_);
  }
}


// Returns true when a per-function compile hint lies within kSlack of
// |position|. As a side effect the hint cursor is moved past every hint that
// is more than kSlack below |position|.
bool Scanner::HasPerFunctionCompileHint(int position) {
  // Allow off-by-<slack> in the compile hints positions, to account for adding
  // newlines at the end of the comment, function positions being off-by-one,
  // etc.
  const int kSlack = 3;
  const int lowest_match = position - kSlack;

  const auto& hints = per_function_compile_hint_positions_;
  auto& cursor = per_function_compile_hint_positions_idx_;

  // Skip hints that are too far below |position| to match.
  while (cursor < hints.size() && hints[cursor] < lowest_match) {
    ++cursor;
  }
  if (cursor >= hints.size()) return false;

  const int candidate = hints[cursor];
  return candidate >= lowest_match && candidate <= position + kSlack;
}


// Skips a multi-line comment; on entry c0_ is the '*' of the opening "/*".
// Returns kWhitespace once the closing "*/" has been consumed, or kIllegal if
// the end of input is reached first. If the comment contains a line
// terminator, the "next" token is flagged as following a line terminator.
Token::Value Scanner::SkipMultiLineComment() {
  DCHECK_EQ(c0_, '*');

  // Until we see the first newline, check for * and newline characters.
  if (!next().after_line_terminator) {
    do {
      AdvanceUntil([](base::uc32 c0) {
        // Non-ASCII characters have no entry in the flag table; for them only
        // line terminators matter.
        if (V8_UNLIKELY(static_cast<uint32_t>(c0) > kMaxAscii)) {
          return unibrow::IsLineTerminator(c0);
        }
        uint8_t char_flags = character_scan_flags[c0];
        return MultilineCommentCharacterNeedsSlowPath(char_flags);
      });

      // A run of '*' closes the comment only if it is directly followed by
      // '/'.
      while (c0_ == '*') {
        Advance();
        if (c0_ == '/') {
          Advance();
          return Token::kWhitespace;
        }
      }

      if (unibrow::IsLineTerminator(c0_)) {
        next().after_line_terminator = true;
        break;
      }
    } while (c0_ != kEndOfInput);
  }

  // After we've seen newline, simply try to find '*/'.
  while (c0_ != kEndOfInput) {
    AdvanceUntil([](base::uc32 c0) { return c0 == '*'; });

    while (c0_ == '*') {
      Advance();
      if (c0_ == '/') {
        Advance();
        return Token::kWhitespace;
      }
    }
  }

  // Reached the end of input without finding "*/".
  return Token::kIllegal;
}


// Called with c0_ at the '!' that follows a '<'. If the input continues with
// "--", this is an HTML comment opener: it is recorded in found_html_comment_
// and the comment is skipped. Otherwise the '!' is pushed back and the '<' is
// returned as a plain kLessThan token.
Token::Value Scanner::ScanHtmlComment() {
  // Check for <!-- comments.
  DCHECK_EQ(c0_, '!');
  Advance();

  const bool opens_html_comment = c0_ == '-' && Peek() == '-';
  if (!opens_html_comment) {
    PushBack('!');  // undo Advance()
    return Token::kLessThan;
  }

  Advance();
  found_html_comment_ = true;
  return SkipSingleHTMLComment();
}


#ifdef DEBUG

// Debug-only consistency check for a token descriptor.
void Scanner::SanityCheckTokenDesc(const TokenDesc& token) const {
  // Only TEMPLATE_* tokens can have an invalid_template_escape_message.
  // kIllegal and kUninitialized can have garbage for the field (as can
  // token.literal_chars & other members; that's ok).
  const auto kind = token.token;
  const bool field_is_unconstrained =
      kind == Token::kUninitialized || kind == Token::kIllegal ||
      kind == Token::kTemplateSpan || kind == Token::kTemplateTail;
  if (field_is_unconstrained) return;

  DCHECK_EQ(token.invalid_template_escape_message, MessageTemplate::kNone);
}

#endif  // DEBUG


// Repositions the scanner so that the token starting at |pos| becomes the
// "next" token. Does nothing if the "next" token already starts at |pos|.
// |pos| must not lie before the current source position (DCHECKed).
void Scanner::SeekForward(int pos) {
  // After this call, we will have the token at the given position as
  // the "next" token. The "current" token will be invalid.
  if (pos == next().location.beg_pos) return;
  int current_pos = source_pos();
  DCHECK_EQ(next().location.end_pos, current_pos);
  // Positions inside the lookahead token aren't supported.
  DCHECK(pos >= current_pos);
  if (pos != current_pos) {
    source_->Seek(pos);
    Advance();
    // This function is only called to seek to the location
    // of the end of a function (at the "}" token). It doesn't matter
    // whether there was a line terminator in the part we skip.
    next().after_line_terminator = false;
  }
  Scan();
}


// Scans the part of an escape sequence that follows the backslash; on entry
// c0_ is the character right after the '\'. The decoded character is appended
// to the current literal. Returns false only when a \u or \x escape is
// malformed; the error has then been reported by the helper that scanned it.
//
// With capture_raw == false, an escaped line terminator is consumed and
// contributes nothing to the literal. Octal escapes and \8 / \9 are accepted
// here but recorded in octal_pos_ / octal_message_.
template <bool capture_raw>
bool Scanner::ScanEscape() {
  base::uc32 c = c0_;
  Advance<capture_raw>();

  // Skip escaped newlines.
  DCHECK(!unibrow::IsLineTerminator(kEndOfInput));
  if (!capture_raw && unibrow::IsLineTerminator(c)) {
    // Allow escaped CR+LF newlines in multiline string literals.
    if (IsCarriageReturn(c) && IsLineFeed(c0_)) Advance();
    return true;
  }

  switch (c) {
    case 'b' : c = '\b'; break;
    case 'f' : c = '\f'; break;
    case 'n' : c = '\n'; break;
    case 'r' : c = '\r'; break;
    case 't' : c = '\t'; break;
    case 'u' : {
      c = ScanUnicodeEscape<capture_raw>();
      if (IsInvalid(c)) return false;
      break;
    }
    case 'v':
      c = '\v';
      break;
    case 'x': {
      // \x is followed by exactly two hex digits.
      c = ScanHexNumber<capture_raw>(2);
      if (IsInvalid(c)) return false;
      break;
    }
    case '0':
    case '1':
    case '2':
    case '3':
    case '4':
    case '5':
    case '6':
    case '7':
      // The first octal digit is already in |c|; allow up to two more.
      c = ScanOctalEscape<capture_raw>(c, 2);
      break;
    case '8':
    case '9':
      // '\8' and '\9' are disallowed in strict mode.
      // Reuse the octal error state to propagate the error.
      octal_pos_ = Location(source_pos() - 2, source_pos() - 1);
      octal_message_ = capture_raw ? MessageTemplate::kTemplate8Or9Escape
                                   : MessageTemplate::kStrict8Or9Escape;
      break;
  }

  // Other escaped characters are interpreted as their non-escaped version.
  AddLiteralChar(c);
  return true;
}


// Finishes scanning an octal escape whose first digit |c| has already been
// consumed. Up to |length| further octal digits are consumed, stopping early
// if the value would reach 256. Returns the decoded value.
template <bool capture_raw>
base::uc32 Scanner::ScanOctalEscape(base::uc32 c, int length) {
  DCHECK('0' <= c && c <= '7');
  base::uc32 value = c - '0';
  int extra_digits = 0;
  while (extra_digits < length) {
    const int digit = c0_ - '0';
    if (digit < 0 || digit > 7) break;
    const int widened = value * 8 + digit;
    if (widened >= 256) break;
    value = widened;
    Advance<capture_raw>();
    ++extra_digits;
  }
  // Anything except '\0' is an octal escape sequence, illegal in strict mode.
  // Remember the position of octal escape sequences so that an error
  // can be reported later (in strict mode).
  // We don't report the error immediately, because the octal escape can
  // occur before the "use strict" directive.
  const bool is_plain_nul_escape =
      c == '0' && extra_digits == 0 && !IsNonOctalDecimalDigit(c0_);
  if (!is_plain_nul_escape) {
    octal_pos_ = Location(source_pos() - extra_digits - 1, source_pos() - 1);
    octal_message_ = capture_raw ? MessageTemplate::kTemplateOctalLiteral
                                 : MessageTemplate::kStrictOctalEscape;
  }
  return value;
}


// Scans a string literal; on entry c0_ is the opening quote character, which
// also serves as the terminator to look for. The decoded contents are
// collected in the "next" token's literal buffer. Returns kString after
// consuming the closing quote, or kIllegal on end of input, an unescaped
// string-literal line terminator, or a failed escape sequence.
Token::Value Scanner::ScanString() {
  base::uc32 quote = c0_;

  next().literal_chars.Start();
  while (true) {
    // Bulk-copy ordinary characters; the lambda returns true for a character
    // that needs individual handling below.
    AdvanceUntil([this](base::uc32 c0) {
      if (V8_UNLIKELY(static_cast<uint32_t>(c0) > kMaxAscii)) {
        if (V8_UNLIKELY(unibrow::IsStringLiteralLineTerminator(c0))) {
          return true;
        }
        AddLiteralChar(c0);
        return false;
      }
      uint8_t char_flags = character_scan_flags[c0];
      if (MayTerminateString(char_flags)) return true;
      AddLiteralChar(c0);
      return false;
    });

    while (c0_ == '\\') {
      Advance();
      // TODO(verwaest): Check whether we can remove the additional check.
      if (V8_UNLIKELY(c0_ == kEndOfInput || !ScanEscape<false>())) {
        return Token::kIllegal;
      }
    }

    if (c0_ == quote) {
      Advance();
      return Token::kString;
    }

    if (V8_UNLIKELY(c0_ == kEndOfInput ||
                    unibrow::IsStringLiteralLineTerminator(c0_))) {
      return Token::kIllegal;
    }

    // The character stopped the bulk scan but is neither the matching quote
    // nor a terminator, so it is part of the string.
    AddLiteralChar(c0_);
  }
}


// Scans a private name; on entry c0_ is '#'. The '#' must be followed
// directly by an identifier start (possibly formed from a surrogate pair).
// The literal includes the leading '#'. Returns kPrivateName on success. If
// the '#' is not followed by an identifier start, an
// kInvalidOrUnexpectedToken error is reported at the '#'; in that case, and
// when the identifier scan itself yields kIllegal, kIllegal is returned.
Token::Value Scanner::ScanPrivateName() {
  next().literal_chars.Start();
  DCHECK_EQ(c0_, '#');
  DCHECK(!IsIdentifierStart(kEndOfInput));
  const int hash_position = source_pos();
  Advance();

  const bool identifier_follows =
      IsIdentifierStart(c0_) ||
      (CombineSurrogatePair() && IsIdentifierStart(c0_));
  if (!identifier_follows) {
    ReportScannerError(hash_position,
                       MessageTemplate::kInvalidOrUnexpectedToken);
    return Token::kIllegal;
  }

  AddLiteralChar('#');
  const Token::Value identifier_token = ScanIdentifierOrKeywordInner();
  if (identifier_token == Token::kIllegal) return Token::kIllegal;
  return Token::kPrivateName;
}


// Scans one chunk of a template literal into the "next" token, filling both
// its cooked (literal_chars) and raw (raw_literal_chars) buffers. Returns
// kTemplateTail if the chunk ended with '`', and kTemplateSpan if it ended
// with "${" or at the end of input.
Token::Value Scanner::ScanTemplateSpan() {
  // When scanning a TemplateSpan, we are looking for the following construct:
  // kTemplateSpan ::
  //     ` LiteralChars* ${
  //   | } LiteralChars* ${
  //
  // kTemplateTail ::
  //     ` LiteralChars* `
  //   | } LiteralChar* `
  //
  // A kTemplateSpan should always be followed by an Expression, while a
  // kTemplateTail terminates a TemplateLiteral and does not need to be
  // followed by an Expression.

  // These scoped helpers save and restore the original error state, so that we
  // can specially treat invalid escape sequences in templates (which are
  // handled by the parser).
  ErrorState scanner_error_state(&scanner_error_, &scanner_error_location_);
  ErrorState octal_error_state(&octal_message_, &octal_pos_);

  Token::Value result = Token::kTemplateSpan;
  next().literal_chars.Start();
  next().raw_literal_chars.Start();
  const bool capture_raw = true;
  while (true) {
    base::uc32 c = c0_;
    if (c == '`') {
      Advance();  // Consume '`'
      result = Token::kTemplateTail;
      break;
    } else if (c == '$' && Peek() == '{') {
      Advance();  // Consume '$'
      Advance();  // Consume '{'
      break;
    } else if (c == '\\') {
      Advance();  // Consume '\\'
      DCHECK(!unibrow::IsLineTerminator(kEndOfInput));
      if (capture_raw) AddRawLiteralChar('\\');
      if (unibrow::IsLineTerminator(c0_)) {
        // The TV of LineContinuation :: \ LineTerminatorSequence is the empty
        // code unit sequence.
        base::uc32 lastChar = c0_;
        Advance();
        if (lastChar == '\r') {
          // Also skip \n.
          if (c0_ == '\n') Advance();
          lastChar = '\n';
        }
        // Only the raw string keeps the (normalized) line terminator.
        if (capture_raw) AddRawLiteralChar(lastChar);
      } else {
        bool success = ScanEscape<capture_raw>();
        USE(success);
        DCHECK_EQ(!success, has_error());
        // For templates, invalid escape sequence checking is handled in the
        // parser.
        scanner_error_state.MoveErrorTo(next_);
        octal_error_state.MoveErrorTo(next_);
      }
    } else if (c == kEndOfInput) {
      // Unterminated template literal
      break;
    } else {
      Advance();  // Consume c.
      // The TRV of LineTerminatorSequence :: <CR> is the CV 0x000A.
      // The TRV of LineTerminatorSequence :: <CR><LF> is the sequence
      // consisting of the CV 0x000A.
      if (c == '\r') {
        if (c0_ == '\n') Advance();  // Consume '\n'
        c = '\n';
      }
      if (capture_raw) AddRawLiteralChar(c);
      AddLiteralChar(c);
    }
  }
  next().location.end_pos = source_pos();
  next().token = result;

  return result;
}


// Returns the value collected from a sourceURL magic comment as an
// internalized string, or a default-constructed handle when no non-empty
// value was collected.
template <typename IsolateT>
DirectHandle<String> Scanner::SourceUrl(IsolateT* isolate) const {
  if (!(source_url_.length() > 0)) return DirectHandle<String>();
  return DirectHandle<String>(source_url_.Internalize(isolate));
}

template DirectHandle<String> Scanner::SourceUrl(Isolate* isolate) const;
template DirectHandle<String> Scanner::SourceUrl(LocalIsolate* isolate) const;


// Returns the value collected from a sourceMappingURL magic comment as an
// internalized string, or a default-constructed handle when no non-empty
// value was collected.
template <typename IsolateT>
DirectHandle<String> Scanner::SourceMappingUrl(IsolateT* isolate) const {
  if (!(source_mapping_url_.length() > 0)) return DirectHandle<String>();
  return DirectHandle<String>(source_mapping_url_.Internalize(isolate));
}

template DirectHandle<String> Scanner::SourceMappingUrl(Isolate* isolate) const;
template DirectHandle<String> Scanner::SourceMappingUrl(
    LocalIsolate* isolate) const;


// Scans a run of digits accepted by |predicate|, allowing single '_'
// separators between them. Digits are appended to the current literal;
// separators are dropped. When |is_check_first_digit| is set, the first
// character must be a digit. Returns false (after reporting an error) for two
// adjacent separators or a trailing separator, and false without reporting
// when the required first digit is missing.
bool Scanner::ScanDigitsWithNumericSeparators(bool (*predicate)(base::uc32 ch),
                                              bool is_check_first_digit) {
  // we must have at least one digit after 'x'/'b'/'o'
  if (is_check_first_digit && !predicate(c0_)) return false;

  bool ended_on_separator = false;
  for (;;) {
    if (c0_ == '_') {
      Advance();
      if (c0_ == '_') {
        ReportScannerError(Location(source_pos(), source_pos() + 1),
                           MessageTemplate::kContinuousNumericSeparator);
        return false;
      }
      ended_on_separator = true;
    } else if (predicate(c0_)) {
      ended_on_separator = false;
      AddLiteralCharAdvance();
    } else {
      break;
    }
  }

  if (!ended_on_separator) return true;

  ReportScannerError(Location(source_pos(), source_pos() + 1),
                     MessageTemplate::kTrailingNumericSeparator);
  return false;
}


// Scans a (possibly empty) run of decimal digits into the current literal.
// With |allow_numeric_separator| the separator-aware scanner is used;
// without it, a '_' directly after the digits is reported as
// kInvalidOrUnexpectedToken and makes the scan fail.
bool Scanner::ScanDecimalDigits(bool allow_numeric_separator) {
  if (allow_numeric_separator) {
    return ScanDigitsWithNumericSeparators(&IsDecimalDigit, false);
  }

  while (IsDecimalDigit(c0_)) AddLiteralCharAdvance();

  if (c0_ != '_') return true;

  ReportScannerError(Location(source_pos(), source_pos() + 1),
                     MessageTemplate::kInvalidOrUnexpectedToken);
  return false;
}


bool Scanner::ScanDecimalAsSmiWithNumericSeparators(uint64_t* value) {

  bool separator_seen = false;

  while (IsDecimalDigit(c0_) || c0_ == '_') {

    if (c0_ == '_') {

      Advance();

      if (c0_ == '_') {

        ReportScannerError(Location(source_pos(), source_pos() + 1),

                           MessageTemplate::kContinuousNumericSeparator);

        return false;

      }

      separator_seen = true;

      continue;

    }

    separator_seen = false;

    *value = 10 * *value + (c0_ - '0');

    base::uc32 first_char = c0_;

    Advance();

    AddLiteralChar(first_char);

  }


  if (separator_seen) {

    ReportScannerError(Location(source_pos(), source_pos() + 1),

                       MessageTemplate::kTrailingNumericSeparator);

    return false;

  }


  return true;

}


bool Scanner::ScanDecimalAsSmi(uint64_t* value, bool allow_numeric_separator) {

  if (allow_numeric_separator) {

    return ScanDecimalAsSmiWithNumericSeparators(value);

  }


  while (IsDecimalDigit(c0_)) {

    *value = 10 * *value + (c0_ - '0');

    base::uc32 first_char = c0_;

    Advance();

    AddLiteralChar(first_char);

  }

  return true;

}


// Scans binary digits (with numeric separators); at least one digit is
// required.
bool Scanner::ScanBinaryDigits() {
  return ScanDigitsWithNumericSeparators(&IsBinaryDigit, true);
}


// Scans octal digits (with numeric separators); at least one digit is
// required.
bool Scanner::ScanOctalDigits() {
  return ScanDigitsWithNumericSeparators(&IsOctalDigit, true);
}


// Scans the digits of a legacy octal literal (leading zero, no prefix). If
// the octal digits are followed by a non-octal decimal digit, |*kind| is
// switched to DECIMAL_WITH_LEADING_ZERO and the remaining digits are left
// for the caller. Otherwise the literal is complete and recorded as a
// pending strict-mode octal error spanning from |start_pos|. Always returns
// true.
bool Scanner::ScanImplicitOctalDigits(int start_pos,
                                      Scanner::NumberKind* kind) {
  DCHECK_EQ(*kind, IMPLICIT_OCTAL);

  // (possible) octal number
  while (IsOctalDigit(c0_)) AddLiteralCharAdvance();

  if (IsNonOctalDecimalDigit(c0_)) {
    *kind = DECIMAL_WITH_LEADING_ZERO;
    return true;
  }

  // Octal literal finished.
  octal_pos_ = Location(start_pos, source_pos());
  octal_message_ = MessageTemplate::kStrictOctalLiteral;
  return true;
}


// Scans hex digits (with numeric separators); at least one digit is required.
bool Scanner::ScanHexDigits() {
  return ScanDigitsWithNumericSeparators(&IsHexDigit, true);
}


// Scans an optional '+' or '-' followed by decimal digits (numeric separators
// allowed) into the current literal. Fails if no digit follows the optional
// sign.
bool Scanner::ScanSignedInteger() {
  const bool has_sign = c0_ == '+' || c0_ == '-';
  if (has_sign) AddLiteralCharAdvance();
  // we must have at least one decimal digit after 'e'/'E'
  return IsDecimalDigit(c0_) && ScanDecimalDigits(true);
}


// Scans a numeric literal into the "next" token. |seen_period| is true when
// the caller has already consumed a leading '.', in which case c0_ is the
// first digit of the fraction. Returns kSmi (value in next().smi_value),
// kNumber, kBigInt, or kIllegal for a malformed literal. Legacy octal and
// leading-zero decimal literals are accepted here and recorded in octal_pos_ /
// octal_message_.
Token::Value Scanner::ScanNumber(bool seen_period) {
  DCHECK(IsDecimalDigit(c0_));  // the first digit of the number or the fraction

  NumberKind kind = DECIMAL;

  next().literal_chars.Start();
  // Whether the Smi fast path below may still be taken.
  bool at_start = !seen_period;
  int start_pos = source_pos();  // For reporting octal positions.
  if (seen_period) {
    // we have already seen a decimal point of the float
    AddLiteralChar('.');
    if (c0_ == '_') {
      return Token::kIllegal;
    }
    // we know we have at least one digit
    if (!ScanDecimalDigits(true)) return Token::kIllegal;
  } else {
    // if the first character is '0' we must check for octals and hex
    if (c0_ == '0') {
      AddLiteralCharAdvance();

      // either 0, 0exxx, 0Exxx, 0.xxx, a hex number, a binary number or
      // an octal number.
      if (AsciiAlphaToLower(c0_) == 'x') {
        AddLiteralCharAdvance();
        kind = HEX;
        if (!ScanHexDigits()) return Token::kIllegal;
      } else if (AsciiAlphaToLower(c0_) == 'o') {
        AddLiteralCharAdvance();
        kind = OCTAL;
        if (!ScanOctalDigits()) return Token::kIllegal;
      } else if (AsciiAlphaToLower(c0_) == 'b') {
        AddLiteralCharAdvance();
        kind = BINARY;
        if (!ScanBinaryDigits()) return Token::kIllegal;
      } else if (IsOctalDigit(c0_)) {
        kind = IMPLICIT_OCTAL;
        if (!ScanImplicitOctalDigits(start_pos, &kind)) {
          return Token::kIllegal;
        }
        // The octal scan ran into an 8 or 9: digits have already been
        // consumed, so the Smi fast path no longer applies.
        if (kind == DECIMAL_WITH_LEADING_ZERO) {
          at_start = false;
        }
      } else if (IsNonOctalDecimalDigit(c0_)) {
        kind = DECIMAL_WITH_LEADING_ZERO;
      } else if (c0_ == '_') {
        ReportScannerError(Location(source_pos(), source_pos() + 1),
                           MessageTemplate::kZeroDigitNumericSeparator);
        return Token::kIllegal;
      }
    }

    // Parse decimal digits and allow trailing fractional part.
    if (IsDecimalNumberKind(kind)) {
      bool allow_numeric_separator = kind != DECIMAL_WITH_LEADING_ZERO;
      // This is an optimization for parsing Decimal numbers as Smi's.
      if (at_start) {
        uint64_t value = 0;
        // scan subsequent decimal digits
        if (!ScanDecimalAsSmi(&value, allow_numeric_separator)) {
          return Token::kIllegal;
        }

        // Take the fast path only for a short literal whose value fits a Smi
        // and that is not continued by a fraction or an identifier start.
        if (next().literal_chars.one_byte_literal().length() <= 10 &&
            value <= Smi::kMaxValue && c0_ != '.' && !IsIdentifierStart(c0_)) {
          next().smi_value = static_cast<uint32_t>(value);

          if (kind == DECIMAL_WITH_LEADING_ZERO) {
            octal_pos_ = Location(start_pos, source_pos());
            octal_message_ = MessageTemplate::kStrictDecimalWithLeadingZero;
          }
          return Token::kSmi;
        }
      }

      if (!ScanDecimalDigits(allow_numeric_separator)) {
        return Token::kIllegal;
      }
      if (c0_ == '.') {
        seen_period = true;
        AddLiteralCharAdvance();
        if (c0_ == '_') {
          return Token::kIllegal;
        }
        if (!ScanDecimalDigits(true)) return Token::kIllegal;
      }
    }
  }

  bool is_bigint = false;
  if (c0_ == 'n' && !seen_period && IsValidBigIntKind(kind)) {
    // Check that the literal is within our limits for BigInt length.
    // For simplicity, use 4 bits per character to calculate the maximum
    // allowed literal length.
    static const int kMaxBigIntCharacters = BigInt::kMaxLengthBits / 4;
    // Non-decimal kinds carry a two-character prefix that is not counted.
    int length = source_pos() - start_pos - (kind != DECIMAL ? 2 : 0);
    if (length > kMaxBigIntCharacters) {
      ReportScannerError(Location(start_pos, source_pos()),
                         MessageTemplate::kBigIntTooBig);
      return Token::kIllegal;
    }

    is_bigint = true;
    Advance();
  } else if (AsciiAlphaToLower(c0_) == 'e') {
    // scan exponent, if any
    DCHECK_NE(kind, HEX);  // 'e'/'E' must be scanned as part of the hex number

    if (!IsDecimalNumberKind(kind)) return Token::kIllegal;

    // scan exponent
    AddLiteralCharAdvance();

    if (!ScanSignedInteger()) return Token::kIllegal;
  }

  // The source character immediately following a numeric literal must
  // not be an identifier start or a decimal digit; see ECMA-262
  // section 7.8.3, page 17 (note that we read only one decimal digit
  // if the value is 0).
  if (IsDecimalDigit(c0_) || IsIdentifierStart(c0_)) {
    return Token::kIllegal;
  }

  if (kind == DECIMAL_WITH_LEADING_ZERO) {
    octal_pos_ = Location(start_pos, source_pos());
    octal_message_ = MessageTemplate::kStrictDecimalWithLeadingZero;
  }

  next().number_kind = kind;
  return is_bigint ? Token::kBigInt : Token::kNumber;
}


// Scans a unicode escape inside an identifier. The first character is skipped
// unconditionally (the call site in view enters with c0_ == '\\'); it must be
// followed by 'u' and a unicode escape body. Returns the decoded code point,
// or Invalid() when no 'u' follows or the escape is malformed.
base::uc32 Scanner::ScanIdentifierUnicodeEscape() {
  Advance();
  if (c0_ == 'u') {
    Advance();
    return ScanUnicodeEscape<false>();
  }
  return Invalid();
}


// Decodes the payload of a unicode escape; the leading '\' and 'u' have
// already been read. Two spellings are accepted:
//   \uxxxx     - scanned by ScanHexNumber with an expected length of 4;
//   \u{xxxxxx} - an arbitrary number of hex digits between the braces,
//                scanned with String::kMaxCodePoint as the maximum value.
// For a braced escape that is malformed (invalid hex sequence or missing
// '}'), kInvalidUnicodeEscapeSequence is reported at the current source
// position and Invalid() is returned.
template <bool capture_raw>
base::uc32 Scanner::ScanUnicodeEscape() {
  if (c0_ != '{') {
    // Fixed-width form.
    constexpr bool kIsUnicodeEscape = true;
    return ScanHexNumber<capture_raw, kIsUnicodeEscape>(4);
  }

  // Braced form. The escape began two characters ("\u") before the '{'.
  const int escape_start = source_pos() - 2;
  Advance<capture_raw>();  // Skip '{'.
  const base::uc32 code_point = ScanUnlimitedLengthHexNumber<capture_raw>(
      String::kMaxCodePoint, escape_start);

  const bool well_formed = code_point != kInvalidSequence && c0_ == '}';
  if (!well_formed) {
    ReportScannerError(source_pos(),
                       MessageTemplate::kInvalidUnicodeEscapeSequence);
    return Invalid();
  }

  Advance<capture_raw>();  // Skip '}'.
  return code_point;
}


// Slow-path scan of the remainder of an identifier or keyword, handling
// unicode escapes and surrogate pairs.
//
// |escaped| is true if an escape has already been seen in this identifier;
// it is also set as soon as one is encountered here. |can_be_keyword| is true
// while every character seen so far may still belong to a keyword.
//
// Returns Token::kIllegal if an escape does not decode to a legal identifier
// part, a keyword-like token if the collected one-byte literal matches one
// (mapped to an "escaped" token kind when escapes were used), and
// Token::kIdentifier otherwise.
Token::Value Scanner::ScanIdentifierOrKeywordInnerSlow(bool escaped,
                                                       bool can_be_keyword) {
  for (;;) {
    if (c0_ == '\\') {
      escaped = true;
      const base::uc32 decoded = ScanIdentifierUnicodeEscape();
      // Only allow legal identifier part characters.
      // TODO(verwaest): Make this true.
      // DCHECK(!IsIdentifierPart('\'));
      DCHECK(!IsIdentifierPart(Invalid()));
      if (decoded == '\\' || !IsIdentifierPart(decoded)) {
        return Token::kIllegal;
      }
      can_be_keyword = can_be_keyword && CharCanBeKeyword(decoded);
      AddLiteralChar(decoded);
      continue;
    }

    // CombineSurrogatePair() is only attempted when c0_ on its own is not an
    // identifier part; after a successful combine c0_ is re-tested.
    const bool continues_identifier =
        IsIdentifierPart(c0_) ||
        (CombineSurrogatePair() && IsIdentifierPart(c0_));
    if (!continues_identifier) break;

    can_be_keyword = can_be_keyword && CharCanBeKeyword(c0_);
    AddLiteralCharAdvance();
  }

  // Keyword lookup only applies to one-byte literals whose characters could
  // all appear in a keyword.
  const bool keyword_candidate =
      can_be_keyword && next().literal_chars.is_one_byte();
  if (!keyword_candidate) return Token::kIdentifier;

  const base::Vector<const uint8_t> text =
      next().literal_chars.one_byte_literal();
  const Token::Value token =
      KeywordOrIdentifierToken(text.begin(), text.length());

  // Tokens in [kIdentifier, kYield] are returned as-is, escaped or not.
  if (base::IsInRange(token, Token::kIdentifier, Token::kYield)) return token;

  // Without escapes every remaining token kind is returned unchanged.
  if (!escaped) return token;

  // Escaped spellings: future strict reserved words and the contiguous
  // kLet..kStatic range map to kEscapedStrictReservedWord; everything else
  // becomes kEscapedKeyword.
  static_assert(Token::kLet + 1 == Token::kStatic);
  if (token == Token::kFutureStrictReservedWord ||
      base::IsInRange(token, Token::kLet, Token::kStatic)) {
    return Token::kEscapedStrictReservedWord;
  }
  return Token::kEscapedKeyword;
}


bool Scanner::ScanRegExpPattern() {

  DCHECK_EQ(Token::kUninitialized, next_next().token);

  DCHECK(next().token == Token::kDiv || next().token == Token::kAssignDiv);


  // Scan: ('/' | '/=') RegularExpressionBody '/' RegularExpressionFlags

  bool in_character_class = false;


  // Scan regular expression body: According to ECMA-262, 3rd, 7.8.5,

  // the scanner should pass uninterpreted bodies to the RegExp

  // constructor.

  next().literal_chars.Start();

  if (next().token == Token::kAssignDiv) {

    AddLiteralChar('=');

  }


  while (c0_ != '/' || in_character_class) {

    if (c0_ == kEndOfInput || unibrow::IsLineTerminator(c0_)) {

      return false;

    }

    if (c0_ == '\\') {  // Escape sequence.

      AddLiteralCharAdvance();

      if (c0_ == kEndOfInput || unibrow::IsLineTerminator(c0_)) {

        return false;

      }

      AddLiteralCharAdvance();

      // If the escape allows more characters, i.e., \x??, \u????, or \c?,

      // only "safe" characters are allowed (letters, digits, underscore),

      // otherwise the escape isn't valid and the invalid character has

      // its normal meaning. I.e., we can just continue scanning without

      // worrying whether the following characters are part of the escape

      // or not, since any '/', '\\' or '[' is guaranteed to not be part

      // of the escape sequence.

    } else {  // Unescaped character.

      if (c0_ == '[') in_character_class = true;

      if (c0_ == ']') in_character_class = false;

      AddLiteralCharAdvance();

    }

  }

  Advance();  // consume '/'


  next().token = Token::kRegExpLiteral;

  return true;

}


// Scans the flags that follow a regular expression body. next() must already
// be a kRegExpLiteral token. The flag characters are collected into
// next().literal_chars and next().location.end_pos is moved past them.
//
// Returns the accumulated flag set, or an empty optional if a character is
// not a recognised flag or if the same flag occurs twice.
std::optional<RegExpFlags> Scanner::ScanRegExpFlags() {
  DCHECK_EQ(Token::kRegExpLiteral, next().token);

  RegExpFlags flags;
  next().literal_chars.Start();
  while (IsIdentifierPart(c0_)) {
    // c0_ is a 32-bit value, but JSRegExp::FlagFromChar() takes a plain
    // `char`. Passing c0_ directly would narrow it implicitly, so a non-ASCII
    // identifier character could alias an ASCII flag letter (e.g. U+0167
    // typically truncates to 0x67, 'g'). No flag lies outside ASCII, so
    // reject such characters up front; 0x7F is the last ASCII code point.
    if (c0_ > 0x7F) return {};
    std::optional<RegExpFlag> maybe_flag =
        JSRegExp::FlagFromChar(static_cast<char>(c0_));
    if (!maybe_flag.has_value()) return {};
    RegExpFlag flag = maybe_flag.value();
    // Each flag may be given at most once.
    if (flags & flag) return {};
    AddLiteralCharAdvance();
    flags |= flag;
  }

  next().location.end_pos = source_pos();
  return flags;
}


// Returns the AstRawString that |ast_value_factory| provides for the current
// literal, using the one-byte or two-byte view depending on how the literal
// is stored.
const AstRawString* Scanner::CurrentSymbol(
    AstValueFactory* ast_value_factory) const {
  return is_literal_one_byte()
             ? ast_value_factory->GetOneByteString(literal_one_byte_string())
             : ast_value_factory->GetTwoByteString(literal_two_byte_string());
}


// Returns the AstRawString that |ast_value_factory| provides for the next
// literal, using the one-byte or two-byte view depending on how the literal
// is stored.
const AstRawString* Scanner::NextSymbol(
    AstValueFactory* ast_value_factory) const {
  return is_next_literal_one_byte()
             ? ast_value_factory->GetOneByteString(
                   next_literal_one_byte_string())
             : ast_value_factory->GetTwoByteString(
                   next_literal_two_byte_string());
}


// Returns the AstRawString that |ast_value_factory| provides for the current
// raw literal, using the one-byte or two-byte view depending on how the raw
// literal is stored.
const AstRawString* Scanner::CurrentRawSymbol(
    AstValueFactory* ast_value_factory) const {
  return is_raw_literal_one_byte()
             ? ast_value_factory->GetOneByteString(
                   raw_literal_one_byte_string())
             : ast_value_factory->GetTwoByteString(
                   raw_literal_two_byte_string());
}


// Converts the current one-byte numeric literal to a double, using the
// conversion routine that matches the number kind recorded on the current
// token.
//
// Every NumberKind enumerator is listed explicitly and there is deliberately
// no `default:` label, so a newly added kind is still flagged by -Wswitch.
// The decimal kinds break out of the switch to a single trailing return, so
// control can never flow off the end of this non-void function.
double Scanner::DoubleValue() {
  DCHECK(is_literal_one_byte());
  switch (current().number_kind) {
    case IMPLICIT_OCTAL:
      return ImplicitOctalStringToDouble(literal_one_byte_string());
    case BINARY:
      return BinaryStringToDouble(literal_one_byte_string());
    case OCTAL:
      return OctalStringToDouble(literal_one_byte_string());
    case HEX:
      return HexStringToDouble(literal_one_byte_string());
    case DECIMAL:
    case DECIMAL_WITH_LEADING_ZERO:
      break;
  }
  // Decimal literals, with or without a leading zero.
  return StringToDouble(literal_one_byte_string(), NO_CONVERSION_FLAG);
}


// Copies the current one-byte literal into a buffer allocated from |zone|
// and appends a terminating NUL. The literal must be one-byte.
const char* Scanner::CurrentLiteralAsCString(Zone* zone) const {
  DCHECK(is_literal_one_byte());
  const base::Vector<const uint8_t> literal = literal_one_byte_string();
  const int char_count = literal.length();
  // One extra slot for the terminator.
  char* const copy = zone->AllocateArray<char>(char_count + 1);
  memcpy(copy, literal.begin(), char_count);
  copy[char_count] = '\0';
  return copy;
}


void Scanner::SeekNext(size_t position) {

  // Use with care: This cleanly resets most, but not all scanner state.

  // TODO(vogelheim): Fix this, or at least DCHECK the relevant conditions.


  // To re-scan from a given character position, we need to:

  // 1, Reset the current_, next_ and next_next_ tokens

  //    (next_ + next_next_ will be overwrittem by Next(),

  //     current_ will remain unchanged, so overwrite it fully.)

  for (TokenDesc& token : token_storage_) {

    token.token = Token::kUninitialized;

    token.invalid_template_escape_message = MessageTemplate::kNone;

  }

  // 2, reset the source to the desired position,

  source_->Seek(position);

  // 3, re-scan, by scanning the look-ahead char + 1 token (next_).

  c0_ = source_->Advance();

  next().after_line_terminator = false;

  Scan();

  DCHECK_EQ(next().location.beg_pos, static_cast<int>(position));

}


}  // namespace v8::internal

ast-value-factory.h

kind
Builtins::Kind kind
Definition builtins.cc:40

pos
SourcePosition pos
Definition class-debug-reader-generator.cc:34

v8::base::Flags< RegExpFlag >

v8::base::Vector
Definition zone-list.h:15

v8::base::Vector::length
int length() const
Definition vector.h:64

v8::base::Vector::begin
constexpr T * begin() const
Definition vector.h:96

v8::internal::AstRawString
Definition ast-value-factory.h:51

v8::internal::AstValueFactory
Definition ast-value-factory.h:339

v8::internal::AstValueFactory::GetOneByteString
const AstRawString * GetOneByteString(base::Vector< const uint8_t > literal)
Definition ast-value-factory.h:376

v8::internal::AstValueFactory::GetTwoByteString
const AstRawString * GetTwoByteString(base::Vector< const uint16_t > literal)
Definition ast-value-factory.h:382

v8::internal::BigIntBase::kMaxLengthBits
static const uint32_t kMaxLengthBits
Definition bigint.h:105

v8::internal::DirectHandle
Definition handles.h:659

v8::internal::Isolate
Definition isolate.h:586

v8::internal::JSRegExp::FlagFromChar
static std::optional< RegExpFlag > FlagFromChar(char c)
Definition js-regexp.h:61

v8::internal::LiteralBuffer
Definition literal-buffer.h:17

v8::internal::LiteralBuffer::Start
void Start()
Definition literal-buffer.h:67

v8::internal::LiteralBuffer::length
int length() const
Definition literal-buffer.h:65

v8::internal::LiteralBuffer::Internalize
DirectHandle< String > Internalize(IsolateT *isolate) const
Definition literal-buffer.cc:17

v8::internal::LiteralBuffer::is_one_byte
bool is_one_byte() const
Definition literal-buffer.h:41

v8::internal::LiteralBuffer::one_byte_literal
base::Vector< const uint8_t > one_byte_literal() const
Definition literal-buffer.h:52

v8::internal::LocalIsolate
Definition local-isolate.h:45

v8::internal::Scanner::BookmarkScope::bookmark_
size_t bookmark_
Definition scanner.h:240

v8::internal::Scanner::BookmarkScope::kNoBookmark
static const size_t kNoBookmark
Definition scanner.h:236

v8::internal::Scanner::BookmarkScope::HasBeenSet
bool HasBeenSet() const
Definition scanner.cc:85

v8::internal::Scanner::BookmarkScope::kBookmarkWasApplied
static const size_t kBookmarkWasApplied
Definition scanner.h:237

v8::internal::Scanner::BookmarkScope::HasBeenApplied
bool HasBeenApplied() const
Definition scanner.cc:89

v8::internal::Scanner::BookmarkScope::Apply
void Apply()
Definition scanner.cc:74

v8::internal::Scanner::BookmarkScope::Set
void Set(size_t bookmark)
Definition scanner.cc:69

v8::internal::Scanner::ErrorState
Definition scanner.cc:26

v8::internal::Scanner::ErrorState::ErrorState
ErrorState(MessageTemplate *message_stack, Scanner::Location *location_stack)
Definition scanner.cc:28

v8::internal::Scanner::ErrorState::message_stack_
MessageTemplate *const message_stack_
Definition scanner.cc:55

v8::internal::Scanner::ErrorState::MoveErrorTo
void MoveErrorTo(TokenDesc *dest)
Definition scanner.cc:42

v8::internal::Scanner::ErrorState::location_stack_
Scanner::Location *const location_stack_
Definition scanner.cc:57

v8::internal::Scanner::ErrorState::old_message_
MessageTemplate const old_message_
Definition scanner.cc:56

v8::internal::Scanner::ErrorState::~ErrorState
~ErrorState()
Definition scanner.cc:37

v8::internal::Scanner::ErrorState::old_location_
Scanner::Location const old_location_
Definition scanner.cc:58

v8::internal::Scanner::AddLiteralCharAdvance
V8_INLINE void AddLiteralCharAdvance()
Definition scanner.h:545

v8::internal::Scanner::SeekForward
void SeekForward(int pos)
Definition scanner.cc:448

v8::internal::Scanner::Next
Token::Value Next()
Definition scanner.cc:162

v8::internal::Scanner::octal_message_
MessageTemplate octal_message_
Definition scanner.h:775

v8::internal::Scanner::literal_two_byte_string
base::Vector< const uint16_t > literal_two_byte_string() const
Definition scanner.h:620

v8::internal::Scanner::ScanIdentifierOrKeywordInner
V8_INLINE Token::Value ScanIdentifierOrKeywordInner()
Definition scanner-inl.h:265

v8::internal::Scanner::IsValidBigIntKind
bool IsValidBigIntKind(NumberKind kind)
Definition scanner.h:490

v8::internal::Scanner::raw_literal_two_byte_string
base::Vector< const uint16_t > raw_literal_two_byte_string() const
Definition scanner.h:648

v8::internal::Scanner::current_
TokenDesc * current_
Definition scanner.h:747

v8::internal::Scanner::next_next_next_
TokenDesc * next_next_next_
Definition scanner.h:750

v8::internal::Scanner::SkipMagicComment
Token::Value SkipMagicComment(base::uc32 hash_or_at_sign)
Definition scanner.cc:245

v8::internal::Scanner::IsInvalid
static bool IsInvalid(base::uc32 c)
Definition scanner.cc:114

v8::internal::Scanner::ScanBinaryDigits
bool ScanBinaryDigits()
Definition scanner.cc:801

v8::internal::Scanner::ScanHexDigits
bool ScanHexDigits()
Definition scanner.cc:829

v8::internal::Scanner::kInvalidSequence
static constexpr base::uc32 kInvalidSequence
Definition scanner.h:278

v8::internal::Scanner::next_next
const TokenDesc & next_next() const
Definition scanner.h:742

v8::internal::Scanner::PushBack
void PushBack(base::uc32 ch)
Definition scanner.h:578

v8::internal::Scanner::AddLiteralChar
V8_INLINE void AddLiteralChar(base::uc32 c)
Definition scanner.h:535

v8::internal::Scanner::ScanIdentifierOrKeywordInnerSlow
Token::Value ScanIdentifierOrKeywordInnerSlow(bool escaped, bool can_be_keyword)
Definition scanner.cc:1001

v8::internal::Scanner::IsDecimalNumberKind
bool IsDecimalNumberKind(NumberKind kind)
Definition scanner.h:494

v8::internal::Scanner::ScanSignedInteger
bool ScanSignedInteger()
Definition scanner.cc:833

v8::internal::Scanner::ScanUnicodeEscape
base::uc32 ScanUnicodeEscape()
Definition scanner.cc:981

v8::internal::Scanner::CombineSurrogatePair
bool CombineSurrogatePair()
Definition scanner.h:564

v8::internal::Scanner::ScanOctalEscape
base::uc32 ScanOctalEscape(base::uc32 c, int length)
Definition scanner.cc:525

v8::internal::Scanner::ScanString
Token::Value ScanString()
Definition scanner.cc:550

v8::internal::Scanner::ScanTemplateSpan
Token::Value ScanTemplateSpan()
Definition scanner.cc:608

v8::internal::Scanner::CurrentSymbol
const AstRawString * CurrentSymbol(AstValueFactory *ast_value_factory) const
Definition scanner.cc:1110

v8::internal::Scanner::literal_one_byte_string
base::Vector< const uint8_t > literal_one_byte_string() const
Definition scanner.h:615

v8::internal::Scanner::ScanNumber
Token::Value ScanNumber(bool seen_period)
Definition scanner.cc:840

v8::internal::Scanner::found_html_comment_
bool found_html_comment_
Definition scanner.h:762

v8::internal::Scanner::source_mapping_url_
LiteralBuffer source_mapping_url_
Definition scanner.h:766

v8::internal::Scanner::location
const Location & location() const
Definition scanner.h:298

v8::internal::Scanner::CurrentLiteralAsCString
const char * CurrentLiteralAsCString(Zone *zone) const
Definition scanner.cc:1152

v8::internal::Scanner::next_literal_one_byte_string
base::Vector< const uint8_t > next_literal_one_byte_string() const
Definition scanner.h:632

v8::internal::Scanner::SkipMultiLineComment
Token::Value SkipMultiLineComment()
Definition scanner.cc:370

v8::internal::Scanner::Scan
V8_INLINE void Scan()
Definition scanner-inl.h:575

v8::internal::Scanner::SourceMappingUrl
DirectHandle< String > SourceMappingUrl(IsolateT *isolate) const
Definition scanner.cc:701

v8::internal::Scanner::PeekAhead
Token::Value PeekAhead()
Definition scanner.cc:193

v8::internal::Scanner::SkipSingleHTMLComment
Token::Value SkipSingleHTMLComment()
Definition scanner.cc:226

v8::internal::Scanner::AddRawLiteralChar
V8_INLINE void AddRawLiteralChar(base::uc32 c)
Definition scanner.h:541

v8::internal::Scanner::source_
Utf16CharacterStream *const source_
Definition scanner.h:754

v8::internal::Scanner::CurrentRawSymbol
const AstRawString * CurrentRawSymbol(AstValueFactory *ast_value_factory) const
Definition scanner.cc:1126

v8::internal::Scanner::ScanOctalDigits
bool ScanOctalDigits()
Definition scanner.cc:805

v8::internal::Scanner::octal_pos_
Location octal_pos_
Definition scanner.h:774

v8::internal::Scanner::next_
TokenDesc * next_
Definition scanner.h:748

v8::internal::Scanner::next_literal_two_byte_string
base::Vector< const uint16_t > next_literal_two_byte_string() const
Definition scanner.h:636

v8::internal::Scanner::Advance
void Advance()
Definition scanner.h:552

v8::internal::Scanner::ScanDecimalAsSmiWithNumericSeparators
bool ScanDecimalAsSmiWithNumericSeparators(uint64_t *value)
Definition scanner.cc:758

v8::internal::Scanner::DoubleValue
double DoubleValue()
Definition scanner.cc:1135

v8::internal::Scanner::raw_literal_one_byte_string
base::Vector< const uint8_t > raw_literal_one_byte_string() const
Definition scanner.h:644

v8::internal::Scanner::AdvanceUntil
V8_INLINE void AdvanceUntil(FunctionType check)
Definition scanner.h:560

v8::internal::Scanner::NumberKind
NumberKind
Definition scanner.h:453

v8::internal::Scanner::OCTAL
@ OCTAL
Definition scanner.h:456

v8::internal::Scanner::DECIMAL
@ DECIMAL
Definition scanner.h:458

v8::internal::Scanner::IMPLICIT_OCTAL
@ IMPLICIT_OCTAL
Definition scanner.h:454

v8::internal::Scanner::DECIMAL_WITH_LEADING_ZERO
@ DECIMAL_WITH_LEADING_ZERO
Definition scanner.h:459

v8::internal::Scanner::BINARY
@ BINARY
Definition scanner.h:455

v8::internal::Scanner::HEX
@ HEX
Definition scanner.h:457

v8::internal::Scanner::c0_
base::uc32 c0_
Definition scanner.h:757

v8::internal::Scanner::PeekAheadAhead
Token::Value PeekAheadAhead()
Definition scanner.cc:209

v8::internal::Scanner::is_next_literal_one_byte
bool is_next_literal_one_byte() const
Definition scanner.h:640

v8::internal::Scanner::ScanUnlimitedLengthHexNumber
base::uc32 ScanUnlimitedLengthHexNumber(base::uc32 max_value, int beg_pos)
Definition scanner.cc:142

v8::internal::Scanner::token_storage_
TokenDesc token_storage_[4]
Definition scanner.h:759

v8::internal::Scanner::ScanEscape
bool ScanEscape()
Definition scanner.cc:468

v8::internal::Scanner::flags_
UnoptimizedCompileFlags flags_
Definition scanner.h:745

v8::internal::Scanner::Scanner
Scanner(Utf16CharacterStream *source, UnoptimizedCompileFlags flags)
Definition scanner.cc:96

v8::internal::Scanner::has_error
bool has_error() const
Definition scanner.h:301

v8::internal::Scanner::saw_non_comment_
bool saw_non_comment_
Definition scanner.h:769

v8::internal::Scanner::source_url_
LiteralBuffer source_url_
Definition scanner.h:765

v8::internal::Scanner::SourceUrl
DirectHandle< String > SourceUrl(IsolateT *isolate) const
Definition scanner.cc:689

v8::internal::Scanner::next
TokenDesc & next()
Definition scanner.h:738

v8::internal::Scanner::source_pos
int source_pos()
Definition scanner.h:720

v8::internal::Scanner::Peek
base::uc32 Peek() const
Definition scanner.h:585

v8::internal::Scanner::ScanIdentifierUnicodeEscape
base::uc32 ScanIdentifierUnicodeEscape()
Definition scanner.cc:973

v8::internal::Scanner::scanner_error_
MessageTemplate scanner_error_
Definition scanner.h:777

v8::internal::Scanner::is_raw_literal_one_byte
bool is_raw_literal_one_byte() const
Definition scanner.h:652

v8::internal::Scanner::ScanDigitsWithNumericSeparators
bool ScanDigitsWithNumericSeparators(bool(*predicate)(base::uc32 ch), bool is_check_first_digit)
Definition scanner.cc:713

v8::internal::Scanner::kEndOfInput
static constexpr base::uc32 kEndOfInput
Definition scanner.h:277

v8::internal::Scanner::Initialize
void Initialize()
Definition scanner.cc:105

v8::internal::Scanner::ScanRegExpFlags
std::optional< RegExpFlags > ScanRegExpFlags()
Definition scanner.cc:1092

v8::internal::Scanner::next_next_next
const TokenDesc & next_next_next() const
Definition scanner.h:743

v8::internal::Scanner::per_function_compile_hint_positions_
std::vector< int > per_function_compile_hint_positions_
Definition scanner.h:770

v8::internal::Scanner::NextSymbol
const AstRawString * NextSymbol(AstValueFactory *ast_value_factory) const
Definition scanner.cc:1118

v8::internal::Scanner::scanner_error_location_
Location scanner_error_location_
Definition scanner.h:778

v8::internal::Scanner::Init
void Init()
Definition scanner.h:506

v8::internal::Scanner::ScanImplicitOctalDigits
bool ScanImplicitOctalDigits(int start_pos, NumberKind *kind)
Definition scanner.cc:809

v8::internal::Scanner::SkipSingleLineComment
Token::Value SkipSingleLineComment()
Definition scanner.cc:234

v8::internal::Scanner::kMaxAscii
static const int kMaxAscii
Definition scanner.h:499

v8::internal::Scanner::ScanRegExpPattern
bool ScanRegExpPattern()
Definition scanner.cc:1048

v8::internal::Scanner::saw_source_mapping_url_magic_comment_at_sign_
bool saw_source_mapping_url_magic_comment_at_sign_
Definition scanner.h:767

v8::internal::Scanner::HasPerFunctionCompileHint
bool HasPerFunctionCompileHint(int position)
Definition scanner.cc:348

v8::internal::Scanner::ScanHexNumber
base::uc32 ScanHexNumber(int expected_length)
Definition scanner.cc:120

v8::internal::Scanner::is_literal_one_byte
bool is_literal_one_byte() const
Definition scanner.h:625

v8::internal::Scanner::per_function_compile_hint_positions_idx_
size_t per_function_compile_hint_positions_idx_
Definition scanner.h:771

v8::internal::Scanner::saw_magic_comment_compile_hints_all_
bool saw_magic_comment_compile_hints_all_
Definition scanner.h:768

v8::internal::Scanner::next_next_
TokenDesc * next_next_
Definition scanner.h:749

v8::internal::Scanner::SeekNext
void SeekNext(size_t position)
Definition scanner.cc:1162

v8::internal::Scanner::ScanDecimalAsSmi
bool ScanDecimalAsSmi(uint64_t *value, bool allow_numeric_separator)
Definition scanner.cc:787

v8::internal::Scanner::Invalid
static constexpr base::uc32 Invalid()
Definition scanner.h:280

v8::internal::Scanner::ScanHtmlComment
Token::Value ScanHtmlComment()
Definition scanner.cc:415

v8::internal::Scanner::ScanPrivateName
Token::Value ScanPrivateName()
Definition scanner.cc:591

v8::internal::Scanner::TryToParseMagicComment
void TryToParseMagicComment(base::uc32 hash_or_at_sign)
Definition scanner.cc:279

v8::internal::Scanner::ReportScannerError
void ReportScannerError(const Location &location, MessageTemplate error)
Definition scanner.h:520

v8::internal::Scanner::ScanDecimalDigits
bool ScanDecimalDigits(bool allow_numeric_separator)
Definition scanner.cc:743

v8::internal::Scanner::current
const TokenDesc & current() const
Definition scanner.h:740

v8::internal::Smi::kMaxValue
static constexpr int kMaxValue
Definition smi.h:101

v8::internal::String::kMaxCodePoint
static const base::uc32 kMaxCodePoint
Definition string.h:504

v8::internal::Token::Value
Value
Definition token.h:215

v8::internal::UnoptimizedCompileFlags
Definition parse-info.h:70

v8::internal::Utf16CharacterStream
Definition scanner.h:40

v8::internal::Utf16CharacterStream::Seek
void Seek(size_t pos)
Definition scanner.h:115

v8::internal::Utf16CharacterStream::Advance
base::uc32 Advance()
Definition scanner.h:67

v8::internal::Zone
Definition zone.h:43

v8::internal::Zone::AllocateArray
T * AllocateArray(size_t length)
Definition zone.h:127

conversions-inl.h

conversions.h

previous
LineAndColumn previous
Definition earley-parser.cc:21

result
ZoneVector< RpoNumber > & result
Definition jump-threading.cc:21

tmp
Register tmp
Definition liftoff-compiler.cc:7526

x
int x
Definition liveedit-diff.cc:60

position
int position
Definition liveedit.cc:290

unibrow::IsStringLiteralLineTerminator
V8_INLINE bool IsStringLiteralLineTerminator(uchar c)
Definition unicode.h:271

unibrow::IsLineTerminator
V8_INLINE bool IsLineTerminator(uchar c)
Definition unicode.h:267

v8::base::uc32
uint32_t uc32
Definition strings.h:19

v8::base::HexValue
int HexValue(uc32 c)
Definition strings.h:34

v8::base::StaticOneByteVector
Vector< const uint8_t > StaticOneByteVector(const char(&array)[N])
Definition vector.h:346

v8::base::IsInRange
constexpr bool IsInRange(T value, U lower_limit, U higher_limit)
Definition bounds.h:20

v8::base::VLQBase64Decode
int32_t VLQBase64Decode(const char *start, size_t sz, size_t *pos)
Definition vlq-base64.cc:37

v8::internal
Definition api-arguments-inl.h:20

v8::internal::IsIdentifierStart
bool IsIdentifierStart(base::uc32 c)
Definition char-predicates-inl.h:137

v8::internal::IsHexDigit
constexpr bool IsHexDigit(base::uc32 c)
Definition char-predicates-inl.h:39

v8::internal::RegExpFlag
RegExpFlag
Definition regexp-flags.h:33

v8::internal::MessageTemplate
MessageTemplate
Definition message-template.h:766

v8::internal::OctalStringToDouble
double OctalStringToDouble(base::Vector< const uint8_t > str)
Definition conversions.cc:788

v8::internal::HexStringToDouble
double HexStringToDouble(base::Vector< const uint8_t > str)
Definition conversions.cc:794

v8::internal::IsCarriageReturn
constexpr bool IsCarriageReturn(base::uc32 c)
Definition char-predicates-inl.h:22

v8::internal::IsWhiteSpaceOrLineTerminator
bool IsWhiteSpaceOrLineTerminator(base::uc32 c)
Definition char-predicates-inl.h:158

v8::internal::CharCanBeKeyword
bool CharCanBeKeyword(base::uc32 c)
Definition scanner-inl.h:260

v8::internal::name
too high values may cause the compiler to set high thresholds for inlining to as much as possible avoid inlined allocation of objects that cannot escape trace load stores from virtual maglev objects use TurboFan fast string builder analyze liveness of environment slots and zap dead values trace TurboFan load elimination emit data about basic block usage in builtins to this enable builtin reordering when run mksnapshot flag for emit warnings when applying builtin profile data verify register allocation in TurboFan randomly schedule instructions to stress dependency tracking enable store store elimination in TurboFan rewrite far to near simulate GC compiler thread race related to allow float parameters to be passed in simulator mode JS Wasm Run additional turbo_optimize_inlined_js_wasm_wrappers enable experimental feedback collection in generic lowering enable Turboshaft s WasmLoadElimination enable Turboshaft s low level load elimination for JS enable Turboshaft s escape analysis for string concatenation use enable Turbolev features that we want to ship in the not too far future trace individual Turboshaft reduction steps trace intermediate Turboshaft reduction steps invocation count threshold for early optimization Enables optimizations which favor memory size over execution speed Enables sampling allocation profiler with X as a sample interval min size of a semi the new space consists of two semi spaces max size of the Collect garbage after Collect garbage after keeps maps alive for< n > old space garbage collections print one detailed trace line in name
Definition flags.cc:2086

v8::internal::flags
Flag flags[]
Definition flags.cc:3797

v8::internal::ImplicitOctalStringToDouble
double ImplicitOctalStringToDouble(base::Vector< const uint8_t > str)
Definition conversions.cc:800

v8::internal::character_scan_flags
static constexpr const uint8_t character_scan_flags[128]
Definition scanner-inl.h:254

v8::internal::IsOctalDigit
constexpr bool IsOctalDigit(base::uc32 c)
Definition char-predicates-inl.h:44

v8::internal::BinaryStringToDouble
double BinaryStringToDouble(base::Vector< const uint8_t > str)
Definition conversions.cc:782

v8::internal::IsNonOctalDecimalDigit
constexpr bool IsNonOctalDecimalDigit(base::uc32 c)
Definition char-predicates-inl.h:49

v8::internal::BranchTargetIdentifier::kNone
@ kNone

v8::internal::MayTerminateString
bool MayTerminateString(uint8_t scan_flags)
Definition scanner-inl.h:249

v8::internal::IsWhiteSpace
bool IsWhiteSpace(base::uc32 c)
Definition char-predicates-inl.h:151

v8::internal::IsDecimalDigit
constexpr bool IsDecimalDigit(base::uc32 c)
Definition char-predicates-inl.h:34

v8::internal::NO_CONVERSION_FLAG
@ NO_CONVERSION_FLAG
Definition conversions.h:149

v8::internal::KeywordOrIdentifierToken
V8_INLINE Token::Value KeywordOrIdentifierToken(const uint8_t *input, int input_length)
Definition scanner-inl.h:101

v8::internal::MultilineCommentCharacterNeedsSlowPath
bool MultilineCommentCharacterNeedsSlowPath(uint8_t scan_flags)
Definition scanner-inl.h:245

v8::internal::IsBinaryDigit
constexpr bool IsBinaryDigit(base::uc32 c)
Definition char-predicates-inl.h:53

v8::internal::IsLineFeed
constexpr bool IsLineFeed(base::uc32 c)
Definition char-predicates-inl.h:24

v8::internal::value
return value
Definition map-inl.h:893

v8::internal::AsciiAlphaToLower
constexpr int AsciiAlphaToLower(base::uc32 c)
Definition char-predicates-inl.h:20

v8::internal::cp
constexpr Register cp
Definition register-arm.h:330

v8::internal::IsIdentifierPart
bool IsIdentifierPart(base::uc32 c)
Definition char-predicates-inl.h:144

v8::internal::StringToDouble
double StringToDouble(const char *str, ConversionFlag flags, double empty_string_val)
Definition conversions.cc:762

v8::internal::length
size_t length
Definition external-reference.cc:1491

bigint.h

parse-info.h

scanner-inl.h

scanner.h

DCHECK_LE
#define DCHECK_LE(v1, v2)
Definition logging.h:490

DCHECK_NOT_NULL
#define DCHECK_NOT_NULL(val)
Definition logging.h:492

DCHECK_NE
#define DCHECK_NE(v1, v2)
Definition logging.h:486

DCHECK
#define DCHECK(condition)
Definition logging.h:482

DCHECK_EQ
#define DCHECK_EQ(v1, v2)
Definition logging.h:485

USE
#define USE(...)
Definition macros.h:293

strings.h

v8::internal::Scanner::Location
Definition scanner.h:263

v8::internal::Scanner::Location::end_pos
int end_pos
Definition scanner.h:273

v8::internal::Scanner::Location::invalid
static Location invalid()
Definition scanner.h:270

v8::internal::Scanner::TokenDesc
Definition scanner.h:463

v8::internal::Scanner::TokenDesc::token
Token::Value token
Definition scanner.h:467

v8::internal::Scanner::TokenDesc::smi_value
uint32_t smi_value
Definition scanner.h:471

v8::internal::Scanner::TokenDesc::invalid_template_escape_location
Location invalid_template_escape_location
Definition scanner.h:469

v8::internal::Scanner::TokenDesc::location
Location location
Definition scanner.h:464

v8::internal::Scanner::TokenDesc::number_kind
NumberKind number_kind
Definition scanner.h:470

v8::internal::Scanner::TokenDesc::literal_chars
LiteralBuffer literal_chars
Definition scanner.h:465

v8::internal::Scanner::TokenDesc::invalid_template_escape_message
MessageTemplate invalid_template_escape_message
Definition scanner.h:468

v8::internal::Scanner::TokenDesc::raw_literal_chars
LiteralBuffer raw_literal_chars
Definition scanner.h:466

v8::internal::Scanner::TokenDesc::after_line_terminator
bool after_line_terminator
Definition scanner.h:472

V8_LIKELY
#define V8_LIKELY(condition)
Definition v8config.h:661

V8_UNLIKELY
#define V8_UNLIKELY(condition)
Definition v8config.h:660

vlq-base64.h

zone.h