From 75f478204a13f0fe250d841b0223227872339c4e Mon Sep 17 00:00:00 2001
From: Josh Holtrop <jholtrop@gmail.com>
Date: Sun, 9 Jul 2023 22:22:50 -0400
Subject: [PATCH] Replace Token struct with integer type

Replace _TOKEN_COUNT with INVALID_TOKEN_ID.
---
 assets/parser.d.erb    | 62 +++++++++++-------------------------------
 lib/propane/grammar.rb |  4 +++
 lib/propane/parser.rb  |  2 +-
 3 files changed, 21 insertions(+), 47 deletions(-)

diff --git a/assets/parser.d.erb b/assets/parser.d.erb
index 14aa6c7..aee77dd 100644
--- a/assets/parser.d.erb
+++ b/assets/parser.d.erb
@@ -26,9 +26,9 @@ class <%= @classname %>
     /* An invalid ID value. */
     private enum INVALID_ID = 0xFFFF_FFFFu;
 
-    alias TokenID = uint;
+    alias Token = <%= get_type_for(@grammar.invalid_token_id) %>;
 
-    enum : TokenID
+    enum : Token
     {
 <% @grammar.tokens.each_with_index do |token, index| %>
         TOKEN_<%= token.code_name %> = <%= index %>,
@@ -36,37 +36,7 @@ class <%= @classname %>
 <%     raise "Token ID (#{token.id}) does not match index (#{index}) for token #{token.name}!" %>
 <%   end %>
 <% end %>
-        _TOKEN_COUNT = <%= @grammar.tokens.size %>,
-    }
-
-    struct Token
-    {
-        /* Number of tokens in this parser. */
-        enum count = <%= @grammar.tokens.size %>;
-        TokenID token;
-        alias token this;
-
-        @disable this();
-
-        this(TokenID token)
-        {
-            this.token = token;
-        }
-
-        static Token invalid()
-        {
-            return Token(count);
-        }
-
-        bool is_valid() const
-        {
-            return token < count;
-        }
-
-        bool is_invalid() const
-        {
-            return !is_valid();
-        }
+        INVALID_TOKEN_ID = <%= @grammar.invalid_token_id %>,
     }
 
     alias CodePoint = uint;
@@ -207,7 +177,7 @@ class <%= @classname %>
 <%   if state_table_entry[:token] %>
                   Token(<%= state_table_entry[:token] %>u),
 <%   else %>
-                  Token.invalid(),
+                  INVALID_TOKEN_ID,
 <%   end %>
 <%   if state_table_entry[:code_id] %>
                   <%= state_table_entry[:code_id] %>u,
@@ -289,7 +259,7 @@ class <%= @classname %>
             default: break;
             }
 
-            return Token.invalid();
+            return INVALID_TOKEN_ID;
         }
 
         /**
@@ -306,7 +276,7 @@ class <%= @classname %>
             TokenInfo token_info;
             token_info.row = m_input_row;
             token_info.col = m_input_col;
-            token_info.token = _TOKEN_COUNT;
+            token_info.token = INVALID_TOKEN_ID;
             *out_token_info = token_info; // TODO: remove
             MatchInfo match_info;
             size_t unexpected_input_length;
@@ -322,9 +292,9 @@ class <%= @classname %>
                      * code did not explicitly return a token. So only override
                      * the token to return if the user code does explicitly
                      * return a token. */
-                    if (user_code_token.is_valid())
+                    if (user_code_token != INVALID_TOKEN_ID)
                     {
-                        token_to_accept = user_code_token.token;
+                        token_to_accept = user_code_token;
                     }
                 }
 
@@ -339,7 +309,7 @@ class <%= @classname %>
                 {
                     m_input_col += match_info.delta_col;
                 }
-                if (token_to_accept == _TOKEN_COUNT)
+                if (token_to_accept == INVALID_TOKEN_ID)
                 {
                     return P_DROP;
                 }
@@ -530,13 +500,13 @@ class <%= @classname %>
         size_t parse()
         {
             Lexer.TokenInfo token_info;
-            uint token = _TOKEN_COUNT;
+            uint token = INVALID_TOKEN_ID;
             StateValue[] statevalues = new StateValue[](1);
             uint reduced_rule_set = INVALID_ID;
             ParserValue reduced_parser_value;
             for (;;)
             {
-                if (token == _TOKEN_COUNT)
+                if (token == INVALID_TOKEN_ID)
                 {
                     size_t lexer_result = m_lexer.lex_token(&token_info);
                     if (lexer_result != P_TOKEN)
@@ -567,7 +537,7 @@ class <%= @classname %>
                     if (reduced_rule_set == INVALID_ID)
                     {
                         /* We shifted a token, mark it consumed. */
-                        token = _TOKEN_COUNT;
+                        token = INVALID_TOKEN_ID;
                         statevalues[$-1].pvalue = token_info.pvalue;
                     }
                     else
@@ -593,7 +563,7 @@ class <%= @classname %>
 
                 /* Error, unexpected token. */
                 write("Unexpected token ");
-                if (token < _TOKEN_COUNT)
+                if (token != INVALID_TOKEN_ID)
                 {
                     writeln(token_names[token]);
                 }
@@ -618,7 +588,7 @@ class <%= @classname %>
             {
                 if (shifts[i].symbol == symbol)
                 {
-//                    if (symbol < _TOKEN_COUNT)
+//                    if (symbol != INVALID_TOKEN_ID)
 //                    {
 //                        writeln("Shifting ", token_names[symbol]);
 //                    }
@@ -639,10 +609,10 @@ class <%= @classname %>
             for (uint i = start; i < end; i++)
             {
                 if ((reduces[i].token == token) ||
-                    (reduces[i].token == _TOKEN_COUNT))
+                    (reduces[i].token == INVALID_TOKEN_ID))
                 {
 //                    write("Reducing rule ", reduces[i].rule, ", rule set ", reduces[i].rule_set, " lookahead ");
-//                    if (token < _TOKEN_COUNT)
+//                    if (token != INVALID_TOKEN_ID)
 //                    {
 //                        writeln(token_names[token]);
 //                    }
diff --git a/lib/propane/grammar.rb b/lib/propane/grammar.rb
index 8b8f765..f91983f 100644
--- a/lib/propane/grammar.rb
+++ b/lib/propane/grammar.rb
@@ -30,6 +30,10 @@ class Propane
       @ptypes["default"]
     end
 
+    def invalid_token_id
+      @tokens.size
+    end
+
     private
 
     def parse_grammar!
diff --git a/lib/propane/parser.rb b/lib/propane/parser.rb
index af5f1f5..bfd6245 100644
--- a/lib/propane/parser.rb
+++ b/lib/propane/parser.rb
@@ -62,7 +62,7 @@ class Propane
         reduce_entries =
           case ra = item_set.reduce_actions
           when Rule
-            [{token_id: @grammar.tokens.size, rule_id: ra.id,
+            [{token_id: @grammar.invalid_token_id, rule_id: ra.id,
               rule_set_id: ra.rule_set.id, n_states: ra.components.size}]
           when Hash
             ra.map do |token, rule|