[Parser] Do not eagerly lex IDs (#6542)

Lex them on demand instead to avoid wasted work.
author: Thomas Lively <tlively@google.com> 2024-04-25 21:50:47 -0700
committer: GitHub <noreply@github.com> 2024-04-25 21:50:47 -0700
commit: 003786cb6aede99cf3d188771a27de8e26b555cf (patch)
tree: 3f2b9380ecc183fa47e55cef8c18ae7c87d8a782 /src/parser/lexer.cpp
parent: eccf9f951262bf6909bf75e8865e09d0596dcc09 (diff)
download: binaryen-003786cb6aede99cf3d188771a27de8e26b555cf.tar.gz
binaryen-003786cb6aede99cf3d188771a27de8e26b555cf.tar.bz2
binaryen-003786cb6aede99cf3d188771a27de8e26b555cf.zip
1 files changed, 21 insertions, 20 deletions
diff --git a/src/parser/lexer.cpp b/src/parser/lexer.cpp
index 464cd34c4..8384b5047 100644
--- a/src/parser/lexer.cpp
+++ b/src/parser/lexer.cpp
@@ -1015,21 +1015,6 @@ std::optional<std::string_view> Token::getString() const {
   return {};
 }
 
-std::optional<std::string_view> Token::getID() const {
-  if (auto* tok = std::get_if<IdTok>(&data)) {
-    if (tok->str) {
-      return std::string_view(*tok->str);
-    }
-    if (tok->isStr) {
-      // Remove '$' and quotes.
-      return span.substr(2, span.size() - 3);
-    }
-    // Remove '$'.
-    return span.substr(1);
-  }
-  return {};
-}
-
 void Lexer::skipSpace() {
   while (true) {
     if (auto ctx = annotation(next())) {
@@ -1069,6 +1054,26 @@ bool Lexer::takeRParen() {
   return false;
 }
 
+std::optional<Name> Lexer::takeID() {
+  if (curr) {
+    return std::nullopt;
+  }
+  if (auto result = ident(next())) {
+    index += result->span.size();
+    advance();
+    if (result->str) {
+      return Name(*result->str);
+    }
+    if (result->isStr) {
+      // Remove '$' and quotes.
+      return Name(result->span.substr(2, result->span.size() - 3));
+    }
+    // Remove '$'.
+    return Name(result->span.substr(1));
+  }
+  return std::nullopt;
+}
+
 std::optional<std::string_view> Lexer::takeKeyword() {
   if (curr) {
     return std::nullopt;
@@ -1123,9 +1128,7 @@ std::optional<uint32_t> Lexer::takeAlign() {
 void Lexer::lexToken() {
   // TODO: Ensure we're getting the longest possible match.
   Token tok;
-  if (auto t = ident(next())) {
-    tok = Token{t->span, IdTok{t->isStr, t->str}};
-  } else if (auto t = integer(next())) {
+  if (auto t = integer(next())) {
     tok = Token{t->span, IntTok{t->n, t->sign}};
   } else if (auto t = float_(next())) {
     tok = Token{t->span, FloatTok{t->nanPayload, t->d}};
@@ -1186,8 +1189,6 @@ std::ostream& operator<<(std::ostream& os, const TextPos& pos) {
   return os << pos.line << ":" << pos.col;
 }
 
-std::ostream& operator<<(std::ostream& os, const IdTok&) { return os << "id"; }
-
 std::ostream& operator<<(std::ostream& os, const IntTok& tok) {
   return os << (tok.sign == Pos ? "+" : tok.sign == Neg ? "-" : "") << tok.n;
 }
author	Thomas Lively <tlively@google.com>	2024-04-25 21:50:47 -0700
committer	GitHub <noreply@github.com>	2024-04-25 21:50:47 -0700
commit	003786cb6aede99cf3d188771a27de8e26b555cf (patch)
tree	3f2b9380ecc183fa47e55cef8c18ae7c87d8a782 /src/parser/lexer.cpp
parent	eccf9f951262bf6909bf75e8865e09d0596dcc09 (diff)
download	binaryen-003786cb6aede99cf3d188771a27de8e26b555cf.tar.gz binaryen-003786cb6aede99cf3d188771a27de8e26b555cf.tar.bz2 binaryen-003786cb6aede99cf3d188771a27de8e26b555cf.zip