Skip to content

Commit 7b1231b

Browse files
committed
Reduce allocations in the lexer
- We flatten the representation of (lexer) tokens, so they are now mostly constants (e.g. `RETURN` rather than `Token Return`). - Also shuffle around some of the lexing functions to avoid some intermediate values. Honestly, this code is still pretty bad — it's responsible for 40% of our allocations. Have a couple more ideas on how to reduce node overhead.
1 parent b2a18fc commit 7b1231b

File tree

6 files changed

+292
-234
lines changed

6 files changed

+292
-234
lines changed

src/parser/illuaminateParser.ml

Lines changed: 52 additions & 48 deletions
Original file line numberDiff line numberDiff line change
@@ -3,53 +3,38 @@ module I = Grammar.MenhirInterpreter
33
module PE = Lrgrep_runtime.Interpreter (Parse_errors.Table_error_message) (I)
44
module Error = Error
55

6-
type 'a located =
7-
{ span : Span.t;
8-
start : Lexing.position;
9-
finish : Lexing.position;
10-
token : 'a
11-
}
6+
type located_token = Token.lexer_token * Lexing.position * Lexing.position
127

13-
let lex_one lines (lexbuf : Lexing.lexbuf) =
8+
let lex_one lines (lexbuf : Lexing.lexbuf) : located_token =
149
let start = lexbuf.lex_curr_p in
1510
let token = Lexer.token lines lexbuf in
1611
let finish = lexbuf.lex_curr_p in
17-
{ token; span = Span.of_pos2 lines start lexbuf.lex_curr_p; start; finish }
12+
(token, start, finish)
1813

19-
let lex_leading lines lexbuf =
20-
let rec go xs =
21-
match lex_one lines lexbuf with
22-
| { token = Trivial value; span; _ } -> go ({ Span.value; span } :: xs)
23-
| { token = Token token; _ } as rest -> (List.rev xs, { rest with token })
24-
in
25-
go []
14+
let rec lex_leading_worker lines (lexbuf : Lexing.lexbuf) xs =
15+
let start = lexbuf.lex_curr_p in
16+
match Lexer.token lines lexbuf with
17+
| TRIVIA value ->
18+
lex_leading_worker lines lexbuf
19+
({ Span.value; span = Span.of_pos2 lines start lexbuf.lex_curr_p } :: xs)
20+
| token -> (List.rev xs, (token, start, lexbuf.lex_curr_p))
2621

27-
let lex_trailing file lexbuf prev_line =
22+
let lex_leading lines lexbuf (token : located_token) =
23+
match token with
24+
| TRIVIA value, start, finish ->
25+
lex_leading_worker lines lexbuf [ { Span.value; span = Span.of_pos2 lines start finish } ]
26+
| tok -> ([], tok)
27+
28+
let lex_trailing lines (lexbuf : Lexing.lexbuf) prev_line =
2829
let rec go xs =
29-
match lex_one file lexbuf with
30-
| { token = Trivial value; span; start; _ } when start.pos_lnum = prev_line ->
31-
go ({ Span.value; span } :: xs)
32-
| t -> (List.rev xs, t)
30+
let start = lexbuf.lex_curr_p in
31+
match Lexer.token lines lexbuf with
32+
| TRIVIA value when start.pos_lnum = prev_line ->
33+
go ({ Span.value; span = Span.of_pos2 lines start lexbuf.lex_curr_p } :: xs)
34+
| t -> (List.rev xs, (t, start, lexbuf.lex_curr_p))
3335
in
3436
go []
3537

36-
let lex_token file lexbuf (next : Token.lexer_token located) =
37-
let leading, { token; span = tok_span; start; finish } =
38-
match next with
39-
| { token = Trivial value; span; _ } ->
40-
let leading, t = lex_leading file lexbuf in
41-
({ Span.value; span } :: leading, t)
42-
| { token = Token token; _ } as rest -> ([], { rest with token })
43-
in
44-
match token with
45-
| EoF ->
46-
(* Just return the current "next" token (we won't inspect it after all, and an EOF token with
47-
no trailing data. *)
48-
(Token.make_token leading [] tok_span token, start, finish, next)
49-
| _ ->
50-
let trailing, next = lex_trailing file lexbuf start.pos_lnum in
51-
(Token.make_token leading trailing tok_span token, start, finish, next)
52-
5338
let get_error_message token ~pre_env ~post_env : Error.message =
5439
match
5540
PE.run pre_env
@@ -68,18 +53,29 @@ let get_error_message token ~pre_env ~post_env : Error.message =
6853
let parse start (file : Illuaminate.File_id.t) (lexbuf : Lexing.lexbuf) =
6954
Span.Lines.using file lexbuf @@ fun lines ->
7055
let position_map = Span.Lines.position_map lines in
71-
let rec go env token token_start token_end next = function
56+
let rec go env token next = function
7257
| I.InputNeeded env as checkpoint -> go_input env checkpoint next
73-
| (I.Shifting _ | I.AboutToReduce _) as checkpoint ->
74-
I.resume checkpoint |> go env token token_start token_end next
58+
| (I.Shifting _ | I.AboutToReduce _) as checkpoint -> I.resume checkpoint |> go env token next
7559
| I.HandlingError post_env ->
76-
let message = get_error_message (token, token_start, token_end) ~pre_env:env ~post_env in
60+
let message = get_error_message token ~pre_env:env ~post_env in
7761
Error { Error.file; position_map; message }
7862
| I.Accepted x -> Ok x
7963
| I.Rejected -> assert false
8064
and go_input env checkpoint token =
81-
let token, start, finish, next = lex_token lines lexbuf token in
82-
I.offer checkpoint (token, start, finish) |> go env token start finish next
65+
let leading_trivia, ((token, start, finish) as lex_token) = lex_leading lines lexbuf token in
66+
let span = Span.of_pos2 lines start lexbuf.lex_curr_p in
67+
let token, next =
68+
match token with
69+
| EOF ->
70+
(* Just return the current "next" token (we won't inspect it after all, and an EOF token
71+
with no trailing data. *)
72+
( (Token.make_token ~leading_trivia ~trailing_trivia:[] ~span token, start, finish),
73+
lex_token )
74+
| _ ->
75+
let trailing_trivia, next = lex_trailing lines lexbuf start.pos_lnum in
76+
((Token.make_token ~leading_trivia ~trailing_trivia ~span token, start, finish), next)
77+
in
78+
I.offer checkpoint token |> go env token next
8379
in
8480
try
8581
match start Lexing.dummy_pos with
@@ -91,18 +87,26 @@ let program = parse Grammar.Incremental.program
9187
let repl_exprs = parse Grammar.Incremental.repl_exprs
9288

9389
module Lexer = struct
94-
type token = Token.lexer_token =
95-
| Token of IlluaminateCore.Token.t
90+
type token =
91+
| Token of string
9692
| Trivial of IlluaminateCore.Node.trivial
9793

9894
let lex (file : Illuaminate.File_id.t) (lexbuf : Lexing.lexbuf) =
9995
Span.Lines.using file lexbuf @@ fun lines ->
10096
try
10197
let rec go xs =
102-
let { token; span; _ } = lex_one lines lexbuf in
103-
let xs = { Span.value = token; span } :: xs in
98+
let token, start, finish = lex_one lines lexbuf in
99+
let span = Span.of_pos2 lines start finish in
100+
let value =
101+
match token with
102+
| TRIVIA t -> Trivial t
103+
| t ->
104+
Token
105+
(Token.make_token ~leading_trivia:[] ~trailing_trivia:[] ~span t |> Token.to_string)
106+
in
107+
let xs = { Span.value; span } :: xs in
104108
match token with
105-
| Token EoF -> xs
109+
| EOF -> xs
106110
| _ -> go xs
107111
in
108112
go [] |> List.rev |> Array.of_list |> Result.ok

src/parser/illuaminateParser.mli

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ module Error = Error
44
module Lexer : sig
55
(** The type of tokens produced by the lexer. *)
66
type token =
7-
| Token of IlluaminateCore.Token.t
7+
| Token of string
88
| Trivial of IlluaminateCore.Node.trivial
99

1010
(** Lex a file, producing a simple token stream. *)

src/parser/lexer.mll

Lines changed: 62 additions & 62 deletions
Original file line numberDiff line numberDiff line change
@@ -29,8 +29,8 @@
2929
Buffer.add_string b str;
3030
b
3131

32-
let mk_long_comment c = Trivial (BlockComment c)
33-
let mk_long_string c = Token (String c)
32+
let mk_long_comment c = TRIVIA (BlockComment c)
33+
let mk_long_string c = STRING c
3434
}
3535

3636
let white = [' ' '\t']
@@ -44,85 +44,85 @@ let ident_head = ['a'-'z' 'A'-'Z' '_']
4444
let ident_tail = ident_head | '_' | digit
4545

4646
rule token l = parse
47-
| white+ as x { Trivial (Whitespace x) }
48-
| '\n' { new_line l; Trivial (Whitespace "\n") }
49-
| '\r' '\n' { new_line l; Trivial (Whitespace "\r\n") }
47+
| white+ as x { TRIVIA (Whitespace x) }
48+
| '\n' { new_line l; TRIVIA (Whitespace "\n") }
49+
| '\r' '\n' { new_line l; TRIVIA (Whitespace "\r\n") }
5050
| ("--[" '='* '[') as x { long_string (buffer_with' 16 x) (String.length x - 4) mk_long_comment l lexbuf }
5151
(* We split line comments into two parts. Otherwise "--[^\n]*" would match "--[[foo]]". *)
5252
| "--" { line_comment lexbuf }
5353

54-
| "and" { Token And }
55-
| "break" { Token Break }
56-
| "do" { Token Do }
57-
| "else" { Token Else }
58-
| "elseif" { Token ElseIf }
59-
| "end" { Token End }
60-
| "false" { Token False }
61-
| "for" { Token For }
62-
| "function" { Token Function }
63-
| "if" { Token If }
64-
| "in" { Token In }
65-
| "local" { Token Local }
66-
| "nil" { Token Nil }
67-
| "not" { Token Not }
68-
| "or" { Token Or }
69-
| "repeat" { Token Repeat }
70-
| "return" { Token Return }
71-
| "then" { Token Then }
72-
| "true" { Token True }
73-
| "until" { Token Until }
74-
| "while" { Token While }
75-
76-
| ":" { Token Colon }
77-
| "::" { Token Double_colon }
78-
| "," { Token Comma }
79-
| "." { Token Dot }
80-
| "..." { Token Dots }
81-
| "=" { Token Equals }
82-
| ";" { Token Semicolon }
83-
84-
| '(' { Token OParen } | ')' { Token CParen }
85-
| '{' { Token OBrace } | '}' { Token CBrace }
86-
| '[' { Token OSquare } | ']' { Token CSquare }
87-
88-
| '+' { Token Add }
89-
| '-' { Token Sub }
90-
| '*' { Token Mul }
91-
| '/' { Token Div }
92-
| '^' { Token Pow }
93-
| '%' { Token Mod }
94-
| ".." { Token Concat }
95-
| "==" { Token Eq }
96-
| "~=" { Token Ne }
97-
| "<" { Token Lt }
98-
| "<=" { Token Le }
99-
| ">" { Token Gt }
100-
| ">=" { Token Ge }
101-
| '#' { Token Len }
54+
| "and" { AND }
55+
| "break" { BREAK }
56+
| "do" { DO }
57+
| "else" { ELSE }
58+
| "elseif" { ELSEIF }
59+
| "end" { END }
60+
| "false" { FALSE }
61+
| "for" { FOR }
62+
| "function" { FUNCTION }
63+
| "if" { IF }
64+
| "in" { IN }
65+
| "local" { LOCAL }
66+
| "nil" { NIL }
67+
| "not" { NOT }
68+
| "or" { OR }
69+
| "repeat" { REPEAT }
70+
| "return" { RETURN }
71+
| "then" { THEN }
72+
| "true" { TRUE }
73+
| "until" { UNTIL }
74+
| "while" { WHILE }
75+
76+
| ":" { COLON }
77+
| "::" { DOUBLE_COLON }
78+
| "," { COMMA }
79+
| "." { DOT }
80+
| "..." { DOTS }
81+
| "=" { EQUALS }
82+
| ";" { SEMICOLON }
83+
84+
| '(' { OPAREN } | ')' { CPAREN }
85+
| '{' { OBRACE } | '}' { CBRACE }
86+
| '[' { OSQUARE } | ']' { CSQUARE }
87+
88+
| '+' { ADD }
89+
| '-' { SUB }
90+
| '*' { MUL }
91+
| '/' { DIV }
92+
| '^' { POW }
93+
| '%' { MOD }
94+
| ".." { CONCAT }
95+
| "==" { EQ }
96+
| "~=" { NE }
97+
| "<" { LT }
98+
| "<=" { LE }
99+
| ">" { GT }
100+
| ">=" { GE }
101+
| '#' { LEN }
102102

103103
(* Numbers *)
104-
| "0x" hex+ as i { Token (Number i) }
105-
| digit+ as i { Token (Number i) }
106-
| digit number* as i { Token (Number i) }
107-
| '.' digit number* as i { Token (Number i) }
104+
| "0x" hex+ as i { NUMBER i }
105+
| digit+ as i { NUMBER i }
106+
| digit number* as i { NUMBER i }
107+
| '.' digit number* as i { NUMBER i }
108108

109109
(* Identifiers *)
110-
| ident_head ident_tail* as i { Token (Ident i) }
110+
| ident_head ident_tail* as i { IDENT i }
111111

112112
| '\"' { string (buffer_with 17 '\"') '\"' lexbuf }
113113
| '\'' { string (buffer_with 17 '\'') '\'' lexbuf }
114114
| ('[' '='* '[') as x { long_string (buffer_with' 16 x) (String.length x - 2) mk_long_string l lexbuf }
115115

116-
| eof { Token EoF }
116+
| eof { EOF }
117117

118118
| _ { unexpected_character lexbuf }
119119

120120
and string contents c = parse
121121
| '\"' { Buffer.add_char contents '\"';
122-
if c = '\"' then Token (String (Buffer.contents contents))
122+
if c = '\"' then STRING (Buffer.contents contents)
123123
else string contents c lexbuf }
124124
| '\'' { Buffer.add_char contents '\'';
125-
if c = '\'' then Token (String (Buffer.contents contents))
125+
if c = '\'' then STRING (Buffer.contents contents)
126126
else string contents c lexbuf }
127127

128128
| "\\a" { Buffer.add_string contents "\\a"; string contents c lexbuf }
@@ -168,4 +168,4 @@ and long_string buf eqs term l = parse
168168
| eof { unterminated_string ~eol:false lexbuf }
169169

170170
and line_comment = parse
171-
| [^'\r' '\n']* as x { Trivial (LineComment ("--" ^ x)) }
171+
| [^'\r' '\n']* as x { TRIVIA (LineComment ("--" ^ x)) }

0 commit comments

Comments
 (0)