Skip to content

Commit c2db2d8

Browse files
Merge pull request #72 from Strumenta/bugfix/localized-issues
Differentiating between several parser and lexer issues
2 parents db2c28a + cae9105 commit c2db2d8

File tree

2 files changed

+245
-15
lines changed

2 files changed

+245
-15
lines changed

src/parsing/tylasu-parser.ts

+55-14
Original file line numberDiff line numberDiff line change
@@ -68,6 +68,8 @@ export class ANTLRTokenFactory extends TokenFactory<TylasuANTLRToken> {
6868
}
6969

7070
export const SYNTAX_ERROR = "parser.syntaxError";
71+
export const MISMATCHED_INPUT = "parser.mismatchedinput";
72+
export const TOKEN_RECOGNITION_ERROR = "lexer.tokenrecognitionerror"
7173
export const INPUT_NOT_FULLY_CONSUMED = "parser.inputNotFullyConsumed";
7274
export const ERROR_NODE_FOUND = "parser.errorNodeFound";
7375

@@ -118,13 +120,31 @@ export abstract class TylasuANTLRLexer<T extends TylasuToken> implements TylasuL
118120
reportAttemptingFullContext() {},
119121
reportContextSensitivity() {},
120122
/**
 * Collects lexer errors as Tylasu lexical issues.
 *
 * Messages of the form "token recognition error at: '<text>'" are reported
 * under TOKEN_RECOGNITION_ERROR with the offending text as a "token"
 * argument; every other message falls back to the generic SYNTAX_ERROR code.
 */
syntaxError<S extends Token, T extends ATNSimulator>(recognizer: Recognizer<T>, offendingSymbol: S | null, line: number, charPositionInLine: number, msg: string) {
    const position = Position.ofPoint(new Point(line, charPositionInLine));
    // Evaluate the regex once with exec() instead of test() followed by
    // match(): avoids running the pattern twice and the unchecked
    // `as string[]` cast on the match result.
    const match = /token recognition error at: '(.+)'/.exec(msg);
    if (match) {
        issues.push(
            Issue.lexical(
                msg, // a matching msg is necessarily non-empty, no fallback needed
                IssueSeverity.ERROR,
                position,
                undefined,
                TOKEN_RECOGNITION_ERROR,
                [{ name: "token", value: match[1] }]));
    } else {
        issues.push(
            Issue.lexical(
                msg || "unspecified",
                IssueSeverity.ERROR,
                position,
                undefined,
                SYNTAX_ERROR));
    }
}
129149
});
130150
}
@@ -281,13 +301,34 @@ export abstract class TylasuParser<
281301
reportAttemptingFullContext() {},
282302
reportContextSensitivity() {},
283303
/**
 * Collects parser errors as Tylasu syntactic issues.
 *
 * "mismatched input '<x>' expecting {A, B, ...}" messages are reported under
 * MISMATCHED_INPUT with the mismatched text and each expected token as
 * structured arguments; every other message falls back to SYNTAX_ERROR.
 */
syntaxError<S extends Token, T extends ATNSimulator>(recognizer: Recognizer<T>, offendingSymbol: S | null, line: number, charPositionInLine: number, msg: string) {
    const position = Position.ofPoint(new Point(line, charPositionInLine));
    // NOTE(review): expected sets containing quoted literal tokens
    // (e.g. "expecting {'+', INT_LIT}") will not match [a-zA-Z_]+ and so
    // fall back to SYNTAX_ERROR — confirm this is intended.
    const mismatchedRegex = /^mismatched input '(<EOF>|.+)' expecting {([a-zA-Z_]+(, [a-zA-Z_]+)*)}$/;
    // Single exec() instead of test() + match(): one regex evaluation and
    // no unchecked `as string[]` cast.
    const match = mismatchedRegex.exec(msg);
    if (match) {
        const args = [
            { name: "mismatched", value: match[1] },
            // One "expected" argument per token in the comma-separated set.
            ...match[2].split(", ").map((expected) => ({ name: "expected", value: expected })),
        ];
        issues.push(
            Issue.syntactic(
                msg,
                IssueSeverity.ERROR,
                position,
                undefined,
                MISMATCHED_INPUT,
                args));
    } else {
        issues.push(
            Issue.syntactic(
                msg || "unspecified",
                IssueSeverity.ERROR,
                position,
                undefined,
                SYNTAX_ERROR));
    }
}
292333
});
293334
}

tests/parsing.test.ts

+190-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
import {expect} from "chai";
22

3-
import {Issue, Node} from "../src";
3+
import {Issue, IssueSeverity, IssueType, Node, Point, Position} from "../src";
44
import {SimpleLangLexer} from "./parser/SimpleLangLexer";
55
import {CharStream, Lexer, TokenStream} from "antlr4ng";
66
import {CompilationUnitContext, SimpleLangParser} from "./parser/SimpleLangParser";
@@ -36,4 +36,193 @@ describe('Parsing', function() {
3636
expect(result.root!.parseTree).to.equal(result.firstStage!.root);
3737
expect(result.code).to.equal(code);
3838
});
39+
it("produce correct issues for: display 1 +",
40+
function () {
41+
const code = "display 1 +";
42+
const parser = new SLParser(new ANTLRTokenFactory());
43+
const result = parser.parse(code);
44+
expect(result.issues).to.eql([new Issue(
45+
IssueType.SYNTACTIC,
46+
"mismatched input '<EOF>' expecting {INT_LIT, DEC_LIT, STRING_LIT, BOOLEAN_LIT}",
47+
IssueSeverity.ERROR,
48+
new Position(new Point(1, 11), new Point(1, 11)),
49+
undefined,
50+
"parser.mismatchedinput",
51+
[
52+
{
53+
name: "mismatched",
54+
value: "<EOF>"
55+
},
56+
{
57+
name: "expected",
58+
value: "INT_LIT"
59+
},
60+
{
61+
name: "expected",
62+
value: "DEC_LIT"
63+
},
64+
{
65+
name: "expected",
66+
value: "STRING_LIT"
67+
},
68+
{
69+
name: "expected",
70+
value: "BOOLEAN_LIT"
71+
}
72+
]
73+
)])
74+
});
75+
it("produce correct issues for: display 1 ++",
76+
function () {
77+
const code = "display 1 ++";
78+
const parser = new SLParser(new ANTLRTokenFactory());
79+
const result = parser.parse(code);
80+
expect(result.issues).to.eql([
81+
new Issue(
82+
IssueType.SYNTACTIC,
83+
"mismatched input '+' expecting {INT_LIT, DEC_LIT, STRING_LIT, BOOLEAN_LIT}",
84+
IssueSeverity.ERROR,
85+
new Position(new Point(1, 11), new Point(1, 11)),
86+
undefined,
87+
"parser.mismatchedinput",
88+
[
89+
{
90+
name: "mismatched",
91+
value: "+"
92+
},
93+
{
94+
name: "expected",
95+
value: "INT_LIT"
96+
},
97+
{
98+
name: "expected",
99+
value: "DEC_LIT"
100+
},
101+
{
102+
name: "expected",
103+
value: "STRING_LIT"
104+
},
105+
{
106+
name: "expected",
107+
value: "BOOLEAN_LIT"
108+
}
109+
]
110+
),
111+
new Issue(
112+
IssueType.SYNTACTIC,
113+
"mismatched input '<EOF>' expecting {INT_LIT, DEC_LIT, STRING_LIT, BOOLEAN_LIT}",
114+
IssueSeverity.ERROR,
115+
new Position(new Point(1, 12), new Point(1, 12)),
116+
undefined,
117+
"parser.mismatchedinput",
118+
[
119+
{
120+
name: "mismatched",
121+
value: "<EOF>"
122+
},
123+
{
124+
name: "expected",
125+
value: "INT_LIT"
126+
},
127+
{
128+
name: "expected",
129+
value: "DEC_LIT"
130+
},
131+
{
132+
name: "expected",
133+
value: "STRING_LIT"
134+
},
135+
{
136+
name: "expected",
137+
value: "BOOLEAN_LIT"
138+
}
139+
]
140+
)])
141+
});
142+
it("produce correct issues for: display",
143+
function () {
144+
const code = "display";
145+
const parser = new SLParser(new ANTLRTokenFactory());
146+
const result = parser.parse(code);
147+
expect(result.issues).to.eql([
148+
new Issue(
149+
IssueType.SYNTACTIC,
150+
"mismatched input '<EOF>' expecting {INT_LIT, DEC_LIT, STRING_LIT, BOOLEAN_LIT}",
151+
IssueSeverity.ERROR,
152+
new Position(new Point(1, 7), new Point(1, 7)),
153+
undefined,
154+
"parser.mismatchedinput",
155+
[
156+
{
157+
name: "mismatched",
158+
value: "<EOF>"
159+
},
160+
{
161+
name: "expected",
162+
value: "INT_LIT"
163+
},
164+
{
165+
name: "expected",
166+
value: "DEC_LIT"
167+
},
168+
{
169+
name: "expected",
170+
value: "STRING_LIT"
171+
},
172+
{
173+
name: "expected",
174+
value: "BOOLEAN_LIT"
175+
}
176+
]
177+
)])
178+
});
179+
it("produce correct issues for: ###",
180+
function () {
181+
const code = "###";
182+
const parser = new SLParser(new ANTLRTokenFactory());
183+
const result = parser.parse(code);
184+
expect(result.issues).to.eql([
185+
new Issue(
186+
IssueType.LEXICAL,
187+
"token recognition error at: '#'",
188+
IssueSeverity.ERROR,
189+
new Position(new Point(1, 0), new Point(1, 0)),
190+
undefined,
191+
"lexer.tokenrecognitionerror",
192+
[
193+
{
194+
name: "token",
195+
value: "#"
196+
}
197+
]
198+
),
199+
new Issue(
200+
IssueType.LEXICAL,
201+
"token recognition error at: '#'",
202+
IssueSeverity.ERROR,
203+
new Position(new Point(1, 1), new Point(1, 1)),
204+
undefined,
205+
"lexer.tokenrecognitionerror",
206+
[
207+
{
208+
name: "token",
209+
value: "#"
210+
}
211+
]
212+
),
213+
new Issue(
214+
IssueType.LEXICAL,
215+
"token recognition error at: '#'",
216+
IssueSeverity.ERROR,
217+
new Position(new Point(1, 2), new Point(1, 2)),
218+
undefined,
219+
"lexer.tokenrecognitionerror",
220+
[
221+
{
222+
name: "token",
223+
value: "#"
224+
}
225+
]
226+
)])
227+
})
39228
});

0 commit comments

Comments
 (0)